framework,version,device,op_name,kernel_source,moe_dtype,num_tokens,hidden_size,inter_size,topk,num_experts,moe_tp_size,moe_ep_size,distribution,latency
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,1,balanced,0.025994665920734406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,1,balanced,0.027450665831565857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,1,power_law_1.01,0.025248000025749208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,1,power_law_1.01,0.025593599677085875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,1,power_law_1.2,0.023014399409294128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,1,power_law_1.2,0.024166400730609893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,128,balanced,0.02314666658639908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,128,balanced,0.02510400116443634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,128,power_law_1.01,0.02181120067834854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,128,power_law_1.01,0.02336000055074692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,128,power_law_1.2,0.021804800629615782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,128,power_law_1.2,0.022387200593948366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,16,balanced,0.023082666099071503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,16,balanced,0.02348266790310542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,16,power_law_1.01,0.023680000007152556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,16,power_law_1.01,0.025171199440956117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,16,power_law_1.2,0.023481599986553192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,16,power_law_1.2,0.024223999679088594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,2,balanced,0.023845332364241283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,2,balanced,0.025349333882331848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,2,power_law_1.01,0.02420479953289032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,2,power_law_1.01,0.025491198897361754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,2,power_law_1.2,0.024172799289226533
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,2,power_law_1.2,0.02436479926109314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,32,balanced,0.024373332659403484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,32,balanced,0.025061334172884624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,32,power_law_1.01,0.02295680046081543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,32,power_law_1.01,0.023737600445747374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,32,power_law_1.2,0.02111999988555908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,32,power_law_1.2,0.02260479927062988
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,4,balanced,0.023472001155217487
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,4,balanced,0.02367999901374181
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,4,power_law_1.01,0.02399359941482544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,4,power_law_1.01,0.0255295991897583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,4,power_law_1.2,0.023014399409294128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,4,power_law_1.2,0.02311040014028549
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,64,balanced,0.023472001155217487
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,64,balanced,0.02526933451493581
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,64,power_law_1.01,0.021792000532150267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,64,power_law_1.01,0.023763200640678404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,64,power_law_1.2,0.021670399606227873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,64,power_law_1.2,0.021932800114154816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,8,balanced,0.023141334454218548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,8,balanced,0.02327999969323476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,8,power_law_1.01,0.023391999304294586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,8,power_law_1.01,0.023481599986553192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,8,power_law_1.2,0.025248000025749208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,1,8,power_law_1.2,0.025279998779296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,2,1,balanced,0.02510400116443634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,2,1,balanced,0.02535466601451238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,2,1,power_law_1.01,0.023814399540424348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,2,1,power_law_1.01,0.02462719976902008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,2,1,power_law_1.2,0.02279680073261261
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,2,1,power_law_1.2,0.023449599742889404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,4,1,balanced,0.023520000278949738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,4,1,balanced,0.024517332514127094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,4,1,power_law_1.01,0.0219200000166893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,4,1,power_law_1.01,0.022720000147819518
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,4,1,power_law_1.2,0.02250880002975464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,2048,768,8,128,4,1,power_law_1.2,0.022758400440216063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,1,balanced,0.031045332551002502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,1,balanced,0.03186666717131933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,1,power_law_1.01,0.028275200724601747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,1,power_law_1.01,0.028441599011421202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,1,power_law_1.2,0.02810240089893341
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,1,power_law_1.2,0.029120001196861266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,128,balanced,0.023797333240509033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,128,balanced,0.025055999557177227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,128,power_law_1.01,0.022937600314617158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,128,power_law_1.01,0.02338559925556183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,128,power_law_1.2,0.02284799963235855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,128,power_law_1.2,0.023104000091552734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,16,balanced,0.025445332129796345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,16,balanced,0.025461333493391674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,16,power_law_1.01,0.02928000092506409
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,16,power_law_1.01,0.030131199955940248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,16,power_law_1.2,0.029868799448013305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,16,power_law_1.2,0.030105599761009218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,2,balanced,0.027434666951497395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,2,balanced,0.02743999908367793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,2,power_law_1.01,0.029139199852943422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,2,power_law_1.01,0.03033599853515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,2,power_law_1.2,0.028832000494003297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,2,power_law_1.2,0.02884480059146881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,256,balanced,0.02720000098148982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,256,balanced,0.027263998985290527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,256,power_law_1.01,0.023763200640678404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,256,power_law_1.2,0.02247679978609085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,256,power_law_1.2,0.023609599471092223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,32,balanced,0.02625600000222524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,32,balanced,0.02754666656255722
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,32,power_law_1.01,0.02818560004234314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,32,power_law_1.01,0.03020800054073334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,32,power_law_1.2,0.028825598955154418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,32,power_law_1.2,0.028863999247550964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,4,balanced,0.026575999955336254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,4,balanced,0.027402666707833607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,4,power_law_1.01,0.028415998816490172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,4,power_law_1.01,0.029209598898887634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,4,power_law_1.2,0.030003198981285097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,4,power_law_1.2,0.03017599880695343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,64,balanced,0.023397333920001984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,64,balanced,0.025050667424996693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,64,power_law_1.01,0.024076800048351287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,64,power_law_1.01,0.026208001375198364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,64,power_law_1.2,0.024780799448490144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,64,power_law_1.2,0.02508159875869751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,8,balanced,0.02531733363866806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,8,balanced,0.02649066597223282
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,8,power_law_1.01,0.02969599962234497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,8,power_law_1.01,0.030131199955940248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,8,power_law_1.2,0.029356798529624938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,1,8,power_law_1.2,0.02974080145359039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,2,1,balanced,0.02717866748571396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,2,1,balanced,0.02738133321205775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,2,1,power_law_1.01,0.024160000681877136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,2,1,power_law_1.01,0.027635198831558228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,2,1,power_law_1.2,0.025279998779296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,2,1,power_law_1.2,0.02584959864616394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,4,1,balanced,0.025285333395004272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,4,1,balanced,0.02536533276240031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,4,1,power_law_1.01,0.023948800563812257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,4,1,power_law_1.01,0.024396799504756927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,4,1,power_law_1.2,0.02398719936609268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,4,1,power_law_1.2,0.026796799898147584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,8,1,balanced,0.025008000433444977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,8,1,balanced,0.02516266703605652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,8,1,power_law_1.01,0.02388480007648468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,8,1,power_law_1.01,0.02632960081100464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,8,1,power_law_1.2,0.02398719936609268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,3072,1536,8,256,8,1,power_law_1.2,0.026368001103401185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,1,balanced,0.060458665092786155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,1,balanced,0.06052800019582113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,1,power_law_1.01,0.05738880038261414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,1,power_law_1.01,0.05749120116233826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,1,power_law_1.2,0.05668479800224304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,1,power_law_1.2,0.05688959956169128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,2,balanced,0.04246933261553446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,2,balanced,0.04460800190766653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,2,power_law_1.01,0.04966399967670441
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,2,power_law_1.01,0.050918400287628174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,2,power_law_1.2,0.049932798743247984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,2,power_law_1.2,0.052665597200393675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,4,balanced,0.03921599934498469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,4,balanced,0.04018666595220566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,4,power_law_1.01,0.04119040071964264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,4,power_law_1.01,0.04583680033683777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,4,power_law_1.2,0.04149760007858276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,4,power_law_1.2,0.044012799859046936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,8,balanced,0.04188799858093262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,8,balanced,0.0466186652580897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,8,power_law_1.01,0.03986560106277466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,8,power_law_1.01,0.041894400119781496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,8,power_law_1.2,0.03939839899539947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,1,8,power_law_1.2,0.042284798622131345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,16,1,balanced,0.02548266698916753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,16,1,balanced,0.026837334036827087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,16,1,power_law_1.01,0.023839999735355378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,16,1,power_law_1.01,0.025964799523353576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,16,1,power_law_1.2,0.024038399755954742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,16,1,power_law_1.2,0.024281600117683412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,2,1,balanced,0.037674665451049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,2,1,balanced,0.040463998913764954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,2,1,power_law_1.01,0.04175359904766083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,2,1,power_law_1.01,0.04195199906826019
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,2,1,power_law_1.2,0.03850879967212677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,2,1,power_law_1.2,0.040006399154663086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,32,1,balanced,0.023391999304294586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,32,1,balanced,0.027189334233601887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,32,1,power_law_1.01,0.02328319996595383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,32,1,power_law_1.01,0.02526719868183136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,32,1,power_law_1.2,0.023923200368881226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,32,1,power_law_1.2,0.025171199440956117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,4,1,balanced,0.027674667537212372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,4,1,balanced,0.02943466603755951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,4,1,power_law_1.01,0.02871040105819702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,4,1,power_law_1.01,0.030822399258613586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,4,1,power_law_1.2,0.02940160036087036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,4,1,power_law_1.2,0.030483201146125793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,8,1,balanced,0.025744001070658367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,8,1,balanced,0.026133333643277485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,8,1,power_law_1.01,0.025766399502754212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,8,1,power_law_1.01,0.026041600108146667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,8,1,power_law_1.2,0.02388480007648468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,14336,2,8,8,1,power_law_1.2,0.02640640139579773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,1,balanced,0.03364799916744232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,1,balanced,0.03578133384386698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,1,power_law_1.01,0.030342400074005127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,1,power_law_1.01,0.03252480030059814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,1,power_law_1.2,0.030483201146125793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,1,power_law_1.2,0.031219199299812317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,128,balanced,0.025397333006064098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,128,balanced,0.027445333699385326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,128,power_law_1.01,0.025516799092292784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,128,power_law_1.01,0.0255295991897583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,128,power_law_1.2,0.024281600117683412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,128,power_law_1.2,0.02566399872303009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,16,balanced,0.02569599946339925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,16,balanced,0.026154667139053345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,16,power_law_1.01,0.031200000643730165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,16,power_law_1.01,0.032179200649261476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,16,power_law_1.2,0.03258239924907684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,16,power_law_1.2,0.03298560082912445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,2,balanced,0.027488000690937042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,2,balanced,0.029743999242782593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,2,power_law_1.01,0.030144000053405763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,2,power_law_1.01,0.03358719944953918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,2,power_law_1.2,0.031564798951148984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,2,power_law_1.2,0.031615999341011045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,32,balanced,0.02516799916823705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,32,balanced,0.02548266698916753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,32,power_law_1.01,0.024889600276947022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,32,power_law_1.01,0.025216001272201537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,32,power_law_1.2,0.024915200471878052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,32,power_law_1.2,0.025119999051094057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,4,balanced,0.02719466636578242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,4,balanced,0.02740799884001414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,4,power_law_1.01,0.031219199299812317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,4,power_law_1.01,0.03276160061359405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,4,power_law_1.2,0.03091199994087219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,4,power_law_1.2,0.03358719944953918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,64,balanced,0.025013332565625507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,64,balanced,0.02722666660944621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,64,power_law_1.01,0.023846399784088135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,64,power_law_1.01,0.02550399899482727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,64,power_law_1.2,0.02391680032014847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,64,power_law_1.2,0.025433599948883057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,8,balanced,0.02625600000222524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,8,balanced,0.027514666318893433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,8,power_law_1.01,0.029631999135017396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,8,power_law_1.01,0.030163198709487915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,8,power_law_1.2,0.03306879997253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,1,8,power_law_1.2,0.03308799862861633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,2,1,balanced,0.029333333174387615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,2,1,balanced,0.02938666691382726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,2,1,power_law_1.01,0.027526399493217467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,2,1,power_law_1.01,0.028198400139808656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,2,1,power_law_1.2,0.026291200518608095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,2,1,power_law_1.2,0.02632960081100464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,4,1,balanced,0.02550933261712392
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,4,1,balanced,0.02735466758410136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,4,1,power_law_1.01,0.024383999407291412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,4,1,power_law_1.01,0.02505599856376648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,4,1,power_law_1.2,0.024710400402545928
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,4,1,power_law_1.2,0.026752001047134398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,8,1,balanced,0.025418666501839954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,8,1,balanced,0.027445333699385326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,8,1,power_law_1.01,0.026374399662017822
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,8,1,power_law_1.01,0.026444798707962035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,8,1,power_law_1.2,0.024537600576877594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,4096,1536,8,128,8,1,power_law_1.2,0.02632319927215576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,1,balanced,0.07817600170771281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,1,balanced,0.07843199868996938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,1,power_law_1.01,0.07647359967231751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,1,power_law_1.01,0.07656959891319275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,1,power_law_1.2,0.07500159740447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,1,power_law_1.2,0.07667840123176575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,2,balanced,0.05533333122730255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,2,balanced,0.058133333921432495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,2,power_law_1.01,0.053465598821640016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,2,power_law_1.01,0.06233599781990051
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,2,power_law_1.2,0.05782399773597717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,2,power_law_1.2,0.06416640281677247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,4,balanced,0.05518933137257894
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,4,balanced,0.055493334929148354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,4,power_law_1.01,0.05400959849357605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,4,power_law_1.01,0.05492479801177978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,4,power_law_1.2,0.05516160130500793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,4,power_law_1.2,0.05991680026054382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,8,balanced,0.05499733487764994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,8,balanced,0.05602133274078369
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,8,power_law_1.01,0.05304960012435913
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,8,power_law_1.01,0.05427200198173523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,8,power_law_1.2,0.052985602617263795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,1,8,power_law_1.2,0.05487359762191772
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,16,1,balanced,0.02571733295917511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,16,1,balanced,0.026261332134405773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,16,1,power_law_1.01,0.02568959891796112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,16,1,power_law_1.01,0.025843200087547303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,16,1,power_law_1.2,0.025548800826072693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,16,1,power_law_1.2,0.02720000147819519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,2,1,balanced,0.05201066533724467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,2,1,balanced,0.05401599903901418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,2,1,power_law_1.01,0.052262401580810545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,2,1,power_law_1.01,0.05235199928283692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,2,1,power_law_1.2,0.050457602739334105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,2,1,power_law_1.2,0.051635199785232545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,32,1,balanced,0.025424001117547352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,32,1,balanced,0.027855999767780304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,32,1,power_law_1.01,0.025964799523353576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,32,1,power_law_1.01,0.026643198728561402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,32,1,power_law_1.2,0.02451840043067932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,32,1,power_law_1.2,0.02460159957408905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,4,1,balanced,0.032431999842325844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,4,1,balanced,0.0335413341720899
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,4,1,power_law_1.01,0.034995201230049136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,4,1,power_law_1.01,0.036025598645210266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,4,1,power_law_1.2,0.03505280017852783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,4,1,power_law_1.2,0.03527039885520935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,8,1,balanced,0.029296000798543293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,8,1,balanced,0.03001066545645396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,8,1,power_law_1.01,0.027551999688148497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,8,1,power_law_1.01,0.029523199796676634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,8,1,power_law_1.2,0.027654400467872618
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,16384,2,8,8,1,power_law_1.2,0.03023360073566437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,1,balanced,0.05390933156013489
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,1,balanced,0.054746667544047035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,1,power_law_1.01,0.050809597969055174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,1,power_law_1.01,0.052172797918319705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,1,power_law_1.2,0.05253120064735413
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,1,power_law_1.2,0.052665597200393675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,128,balanced,0.02735466758410136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,128,balanced,0.027429332335789997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,128,power_law_1.01,0.025843200087547303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,128,power_law_1.01,0.02768639922142029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,128,power_law_1.2,0.02573440074920654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,128,power_law_1.2,0.026169601082801818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,16,balanced,0.029498666524887085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,16,balanced,0.029616000751654308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,16,power_law_1.01,0.050809597969055174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,16,power_law_1.01,0.05248000025749207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,16,power_law_1.2,0.052134400606155394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,16,power_law_1.2,0.05231999754905701
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,2,balanced,0.03317866722742716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,2,balanced,0.033914667864640556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,2,power_law_1.01,0.051641601324081424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,2,power_law_1.01,0.053286397457122804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,2,power_law_1.2,0.052172797918319705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,2,power_law_1.2,0.05233280062675476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,256,balanced,0.027322667340437572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,256,balanced,0.0276053324341774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,256,power_law_1.01,0.02571519911289215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,256,power_law_1.01,0.027321600914001466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,256,power_law_1.2,0.0255295991897583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,32,balanced,0.029109333952267964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,32,balanced,0.029258665939172108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,32,power_law_1.01,0.051660799980163576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,32,power_law_1.01,0.05233280062675476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,32,power_law_1.2,0.051526397466659546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,32,power_law_1.2,0.052799999713897705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,4,balanced,0.029504001140594482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,4,balanced,0.02956266701221466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,4,power_law_1.01,0.05225600004196167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,4,power_law_1.01,0.05268480181694031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,4,power_law_1.2,0.05160319805145264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,4,power_law_1.2,0.05200639963150024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,64,balanced,0.0271573339899381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,64,balanced,0.029146666328112285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,64,power_law_1.01,0.031251201033592226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,64,power_law_1.01,0.03175680041313171
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,64,power_law_1.2,0.03157120048999786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,64,power_law_1.2,0.033055999875068666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,8,balanced,0.029343999922275543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,8,balanced,0.02958400050799052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,8,power_law_1.01,0.051667201519012454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,8,power_law_1.01,0.05256320238113403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,8,power_law_1.2,0.05135359764099121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,1,8,power_law_1.2,0.05191680192947388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,16,1,balanced,0.02740799884001414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,16,1,balanced,0.028186666468779247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,16,1,power_law_1.01,0.02655999958515167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,16,1,power_law_1.01,0.026681599020957947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,16,1,power_law_1.2,0.026815998554229736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,16,1,power_law_1.2,0.027635198831558228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,2,1,balanced,0.03316266586383184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,2,1,balanced,0.03357866654793421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,2,1,power_law_1.01,0.030291199684143066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,2,1,power_law_1.01,0.030316799879074097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,2,1,power_law_1.2,0.030118399858474733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,2,1,power_law_1.2,0.03282560110092163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,32,1,balanced,0.027845333019892376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,32,1,balanced,0.027994667490323383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,32,1,power_law_1.01,0.025996801257133485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,32,1,power_law_1.01,0.02624639868736267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,32,1,power_law_1.2,0.02560639977455139
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,32,1,power_law_1.2,0.026399999856948853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,4,1,balanced,0.030608000854651134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,4,1,balanced,0.03126399964094162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,4,1,power_law_1.01,0.027238398790359497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,4,1,power_law_1.01,0.027609598636627198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,4,1,power_law_1.2,0.02739199995994568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,4,1,power_law_1.2,0.027603200078010558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,8,1,balanced,0.027386667827765148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,8,1,balanced,0.029653333127498627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,8,1,power_law_1.01,0.02645759880542755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,8,1,power_law_1.01,0.02815999984741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,8,1,power_law_1.2,0.02675839960575104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2048,8,256,8,1,power_law_1.2,0.026918399333953857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,1,balanced,0.05996266504128774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,1,balanced,0.061247999469439186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,1,power_law_1.01,0.05785599946975708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,1,power_law_1.01,0.060224002599716185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,1,power_law_1.2,0.059468799829483034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,1,power_law_1.2,0.059654402732849124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,16,balanced,0.029290666182835896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,16,balanced,0.029578665892283123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,16,power_law_1.01,0.05969280004501343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,16,power_law_1.01,0.06059520244598389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,16,power_law_1.2,0.05976960062980652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,16,power_law_1.2,0.06036480069160462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,2,balanced,0.041797334949175514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,2,balanced,0.04358399907747904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,2,power_law_1.01,0.05921919941902161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,2,power_law_1.01,0.06007680296897888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,2,power_law_1.2,0.0595583975315094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,2,power_law_1.2,0.05999360084533691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,32,balanced,0.029445332785447437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,32,balanced,0.029861333469549816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,32,power_law_1.01,0.04690560102462769
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,32,power_law_1.01,0.04780159890651703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,32,power_law_1.2,0.046009600162506104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,32,power_law_1.2,0.04707840085029602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,4,balanced,0.029146666328112285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,4,balanced,0.029477333029111225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,4,power_law_1.01,0.0585919976234436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,4,power_law_1.01,0.06004480123519897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,4,power_law_1.2,0.05914239883422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,4,power_law_1.2,0.059724801778793336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,8,balanced,0.027744000156720478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,8,balanced,0.029493334392706554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,8,power_law_1.01,0.05971199870109558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,8,power_law_1.01,0.06046079993247986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,8,power_law_1.2,0.05875200033187866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,1,8,power_law_1.2,0.06040319800376892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,2,1,balanced,0.03984000037113825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,2,1,balanced,0.043920000394185386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,2,1,power_law_1.01,0.04270080029964447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,2,1,power_law_1.01,0.04286080002784729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,2,1,power_law_1.2,0.041145598888397215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,2,1,power_law_1.2,0.041555199027061465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,4,1,balanced,0.02961066613594691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,4,1,balanced,0.030533333619435627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,4,1,power_law_1.01,0.02869119942188263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,4,1,power_law_1.01,0.028723201155662535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,4,1,power_law_1.2,0.028255999088287354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,4,1,power_law_1.2,0.02873600125312805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,8,1,balanced,0.028192001084486645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,8,1,balanced,0.0286613330245018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,8,1,power_law_1.01,0.026521599292755126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,8,1,power_law_1.01,0.026713600754737853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,8,1,power_law_1.2,0.026662400364875792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,6144,2560,8,160,8,1,power_law_1.2,0.027084800601005554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,1,balanced,0.05770133435726166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,1,balanced,0.057850668827692665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,1,power_law_1.01,0.054118400812149046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,1,power_law_1.01,0.05674239993095398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,1,power_law_1.2,0.05424000024795532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,1,power_law_1.2,0.05694720149040222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,128,balanced,0.02938133229811986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,128,balanced,0.02951466788848241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,128,power_law_1.01,0.027091199159622194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,128,power_law_1.01,0.02781440019607544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,128,power_law_1.2,0.026547199487686156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,128,power_law_1.2,0.028672000765800475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,16,balanced,0.02939733366171519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,16,balanced,0.03054400036732356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,16,power_law_1.01,0.055769598484039305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,16,power_law_1.01,0.05704960227012634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,16,power_law_1.2,0.05555840134620667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,16,power_law_1.2,0.057132798433303836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,2,balanced,0.03760000069936117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,2,balanced,0.03887466589609782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,2,power_law_1.01,0.056377601623535153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,2,power_law_1.01,0.05719040036201477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,2,power_law_1.2,0.054425597190856934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,2,power_law_1.2,0.056569600105285646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,256,balanced,0.027535999814669292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,256,balanced,0.027679999669392902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,256,power_law_1.01,0.02632319927215576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,256,power_law_1.01,0.027910399436950683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,256,power_law_1.2,0.026969599723815917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,256,power_law_1.2,0.027961599826812743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,32,balanced,0.029530666768550873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,32,balanced,0.029557332396507263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,32,power_law_1.01,0.05532159805297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,32,power_law_1.01,0.056831997632980344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,32,power_law_1.2,0.05594879984855652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,32,power_law_1.2,0.05626879930496216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,4,balanced,0.029557332396507263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,4,balanced,0.031290667752424874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,4,power_law_1.01,0.05651199817657471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,4,power_law_1.01,0.05729280114173889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,4,power_law_1.2,0.05625600218772888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,4,power_law_1.2,0.05648639798164368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,64,balanced,0.02938666691382726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,64,balanced,0.029631999631722767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,64,power_law_1.01,0.03592959940433502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,64,power_law_1.01,0.036339199542999266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,64,power_law_1.2,0.03558399975299835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,64,power_law_1.2,0.036723199486732486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,8,balanced,0.029493334392706554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,8,balanced,0.029701332251230877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,8,power_law_1.01,0.05607039928436279
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,8,power_law_1.01,0.05677440166473389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,8,power_law_1.2,0.055244797468185426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,1,8,power_law_1.2,0.05690240263938904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,16,1,balanced,0.029370665550231934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,16,1,balanced,0.02943466603755951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,16,1,power_law_1.01,0.027609598636627198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,16,1,power_law_1.01,0.029049599170684816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,16,1,power_law_1.2,0.026918399333953857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,16,1,power_law_1.2,0.02943359911441803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,2,1,balanced,0.037605332831541695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,2,1,balanced,0.03976000100374222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,2,1,power_law_1.01,0.03442560136318207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,2,1,power_law_1.01,0.036959999799728395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,2,1,power_law_1.2,0.034860798716545106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,2,1,power_law_1.2,0.03610239923000336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,32,1,balanced,0.029317334294319153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,32,1,balanced,0.031258667508761086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,32,1,power_law_1.01,0.027871999144554137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,32,1,power_law_1.01,0.029286399483680725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,32,1,power_law_1.2,0.0268095999956131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,32,1,power_law_1.2,0.027091199159622194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,4,1,balanced,0.02934933453798294
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,4,1,balanced,0.03142933299144109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,4,1,power_law_1.01,0.029235199093818665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,4,1,power_law_1.01,0.031167998909950256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,4,1,power_law_1.2,0.027551999688148497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,4,1,power_law_1.2,0.027980801463127137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,8,1,balanced,0.029520000020662945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,8,1,balanced,0.031258667508761086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,8,1,power_law_1.01,0.027276799082756042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,8,1,power_law_1.01,0.028307199478149414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,8,1,power_law_1.2,0.027353599667549133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,256,8,1,power_law_1.2,0.028531199693679808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,1,balanced,0.058037335673967995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,1,balanced,0.0581279993057251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,1,power_law_1.01,0.05608320236206055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,1,power_law_1.01,0.05626239776611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,1,power_law_1.2,0.05594879984855652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,1,power_law_1.2,0.05667200088500977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,128,balanced,0.027466667195161183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,128,balanced,0.029552000264326733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,128,power_law_1.01,0.028300800919532777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,128,power_law_1.01,0.028889599442481994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,128,power_law_1.2,0.02874239981174469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,128,power_law_1.2,0.02945919930934906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,16,balanced,0.029205332199732464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,16,balanced,0.031008000175158184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,16,power_law_1.01,0.05497599840164184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,16,power_law_1.01,0.05621119737625122
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,16,power_law_1.2,0.05472000241279602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,16,power_law_1.2,0.05583999752998352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,2,balanced,0.035487999518712364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,2,balanced,0.037776000797748566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,2,power_law_1.01,0.05616000294685364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,2,power_law_1.01,0.05658239722251892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,2,power_law_1.2,0.05500800013542175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,2,power_law_1.2,0.056601601839065555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,32,balanced,0.02975466599067052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,32,balanced,0.03145600110292435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,32,power_law_1.01,0.055622398853302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,32,power_law_1.01,0.05626879930496216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,32,power_law_1.2,0.05537279844284058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,32,power_law_1.2,0.056524801254272464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,4,balanced,0.029557332396507263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,4,balanced,0.02959466725587845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,4,power_law_1.01,0.05616000294685364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,4,power_law_1.01,0.056627202033996585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,4,power_law_1.2,0.05617280006408691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,4,power_law_1.2,0.0574400007724762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,64,balanced,0.029520000020662945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,64,balanced,0.03125333289305369
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,64,power_law_1.01,0.05055360198020935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,64,power_law_1.01,0.0506816029548645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,64,power_law_1.2,0.050367999076843264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,64,power_law_1.2,0.050400000810623166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,8,balanced,0.030938667555650074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,8,balanced,0.03136000037193298
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,8,power_law_1.01,0.05583999752998352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,8,power_law_1.01,0.05661439895629883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,8,power_law_1.2,0.05609599947929382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,1,8,power_law_1.2,0.056377601623535153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,16,1,balanced,0.02937600016593933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,16,1,balanced,0.029487999776999157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,16,1,power_law_1.01,0.027225598692893982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,16,1,power_law_1.01,0.02813439965248108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,16,1,power_law_1.2,0.02895359992980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,16,1,power_law_1.2,0.029260799288749695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,2,1,balanced,0.03451200077931086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,2,1,balanced,0.0390079990029335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,2,1,power_law_1.01,0.03561600148677826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,2,1,power_law_1.01,0.036364799737930296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,2,1,power_law_1.2,0.03692800104618073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,2,1,power_law_1.2,0.03842560052871704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,32,1,balanced,0.029530666768550873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,32,1,balanced,0.03139200061559677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,32,1,power_law_1.01,0.026982399821281432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,32,1,power_law_1.01,0.027276799082756042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,32,1,power_law_1.2,0.02720000147819519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,32,1,power_law_1.2,0.027577599883079527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,4,1,balanced,0.029722665747006733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,4,1,balanced,0.03138133386770884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,4,1,power_law_1.01,0.028012800216674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,4,1,power_law_1.01,0.02874239981174469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,4,1,power_law_1.2,0.027968001365661622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,4,1,power_law_1.2,0.02956799864768982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,8,1,balanced,0.029317334294319153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,8,1,balanced,0.029530666768550873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,8,1,power_law_1.01,0.02802560031414032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,8,1,power_law_1.01,0.028563201427459717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,8,1,power_law_1.2,0.027878400683403016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1,7168,2048,8,384,8,1,power_law_1.2,0.02922239899635315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,1,balanced,0.1156160036722819
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,1,balanced,0.11582400401433308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,1,power_law_1.01,0.13129600286483764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,1,power_law_1.01,0.13325439691543578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,1,power_law_1.2,0.13352320194244385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,1,power_law_1.2,0.1368384003639221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,128,balanced,0.0417546679576238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,128,balanced,0.04197333256403605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,128,power_law_1.01,0.04105600118637085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,128,power_law_1.01,0.041247999668121337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,128,power_law_1.2,0.040479999780654904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,128,power_law_1.2,0.041606399416923526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,16,balanced,0.04354666670163473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,16,balanced,0.043605332573254905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,16,power_law_1.01,0.045824000239372255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,16,power_law_1.01,0.04602240025997162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,16,power_law_1.2,0.04679679870605469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,16,power_law_1.2,0.046937599778175354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,2,balanced,0.07273600002129872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,2,balanced,0.07406933108965556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,2,power_law_1.01,0.08222079873085023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,2,power_law_1.01,0.08365439772605895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,2,power_law_1.2,0.08561919927597046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,2,power_law_1.2,0.08767359852790832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,32,balanced,0.04275733232498169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,32,balanced,0.04365866879622141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,32,power_law_1.01,0.04311679899692535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,32,power_law_1.01,0.043584001064300534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,32,power_law_1.2,0.04296959936618805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,32,power_law_1.2,0.0430976003408432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,4,balanced,0.06277333199977875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,4,balanced,0.06295466423034668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,4,power_law_1.01,0.06855040192604064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,4,power_law_1.01,0.07217919826507568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,4,power_law_1.2,0.06969599723815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,4,power_law_1.2,0.0717311978340149
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,64,balanced,0.04168533285458883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,64,balanced,0.04261333247025808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,64,power_law_1.01,0.041222399473190306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,64,power_law_1.01,0.041715198755264284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,64,power_law_1.2,0.041945600509643556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,64,power_law_1.2,0.04225279986858368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,8,balanced,0.04823466638724009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,8,balanced,0.04879466692606608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,8,power_law_1.01,0.05172479748725891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,8,power_law_1.01,0.052876800298690796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,8,power_law_1.2,0.05315840244293213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,1,8,power_law_1.2,0.05345919728279114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,2,1,balanced,0.0867680013179779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,2,1,balanced,0.0888426701227824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,2,1,power_law_1.01,0.09527680277824402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,2,1,power_law_1.01,0.0961471974849701
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,2,1,power_law_1.2,0.09565439820289612
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,2,1,power_law_1.2,0.09590399861335755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,4,1,balanced,0.07206400235493977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,4,1,balanced,0.07333866755167644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,4,1,power_law_1.01,0.0763647973537445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,4,1,power_law_1.01,0.07708160281181335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,4,1,power_law_1.2,0.0772159993648529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,2048,768,8,128,4,1,power_law_1.2,0.07727360129356384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,1,balanced,0.3794826666514079
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,1,balanced,0.38092267513275146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,1,power_law_1.01,0.4460288047790527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,1,power_law_1.01,0.4493696212768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,1,power_law_1.2,0.46895999908447267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,1,power_law_1.2,0.4706240177154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,128,balanced,0.0476800004641215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,128,balanced,0.048122664292653404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,128,power_law_1.01,0.04643200039863586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,128,power_law_1.01,0.04717440009117126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,128,power_law_1.2,0.04713599979877472
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,128,power_law_1.2,0.04723840057849884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,16,balanced,0.07332266867160797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,16,balanced,0.0735093355178833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,16,power_law_1.01,0.07457919716835022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,16,power_law_1.01,0.07500159740447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,16,power_law_1.2,0.07642239928245545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,16,power_law_1.2,0.07857279777526856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,2,balanced,0.19609065850575766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,2,balanced,0.19653334220250449
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,2,power_law_1.01,0.21304960250854493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,2,power_law_1.01,0.21349759101867677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,2,power_law_1.2,0.22367360591888427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,2,power_law_1.2,0.2247488021850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,256,balanced,0.04800533254941305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,256,balanced,0.04801600178082784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,256,power_law_1.01,0.04618239998817444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,256,power_law_1.01,0.04624640047550201
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,256,power_law_1.2,0.046163201332092285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,256,power_law_1.2,0.04647040069103241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,32,balanced,0.05820799867312113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,32,balanced,0.058245331048965454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,32,power_law_1.01,0.057548797130584715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,32,power_law_1.01,0.059308797121047974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,32,power_law_1.2,0.059494400024414064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,32,power_law_1.2,0.060121601819992064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,4,balanced,0.12608533104260763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,4,balanced,0.12657066186269125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,4,power_law_1.01,0.12674560546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,4,power_law_1.01,0.13014400005340576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,4,power_law_1.2,0.1291584014892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,4,power_law_1.2,0.1375488042831421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,64,balanced,0.0497920016447703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,64,balanced,0.05004799862702688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,64,power_law_1.01,0.04888319969177246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,64,power_law_1.01,0.05058559775352478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,64,power_law_1.2,0.05093119740486145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,64,power_law_1.2,0.05182719826698303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,8,balanced,0.12435733278592427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,8,balanced,0.1246560017267863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,8,power_law_1.01,0.10485119819641113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,8,power_law_1.01,0.11333119869232178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,8,power_law_1.2,0.10975359678268433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,1,8,power_law_1.2,0.1119488000869751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,2,1,balanced,0.2365493377049764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,2,1,balanced,0.23809599876403809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,2,1,power_law_1.01,0.2703039884567261
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,2,1,power_law_1.01,0.27302401065826415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,2,1,power_law_1.2,0.2814143896102905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,2,1,power_law_1.2,0.2840192079544067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,4,1,balanced,0.15847466389338175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,4,1,balanced,0.1593706707159678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,4,1,power_law_1.01,0.1709887981414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,4,1,power_law_1.01,0.1739967942237854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,4,1,power_law_1.2,0.17701120376586915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,4,1,power_law_1.2,0.17827199697494506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,8,1,balanced,0.1288479963938395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,8,1,balanced,0.12944533427556357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,8,1,power_law_1.01,0.1372480034828186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,8,1,power_law_1.01,0.13729920387268066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,8,1,power_law_1.2,0.13896960020065308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,3072,1536,8,256,8,1,power_law_1.2,0.13931519985198976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,1,balanced,0.2702186703681946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,1,balanced,0.27024000883102417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,1,power_law_1.01,0.34664320945739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,1,power_law_1.01,0.4396671772003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,1,power_law_1.2,0.3183039903640747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,1,power_law_1.2,0.35552639961242677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,2,balanced,0.1623253325621287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,2,balanced,0.1637279987335205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,2,power_law_1.01,0.23512959480285645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,2,power_law_1.01,0.25683839321136476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,2,power_law_1.2,0.23877758979797364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,2,power_law_1.2,0.24242560863494872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,4,balanced,0.10895466804504395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,4,balanced,0.1113920013109843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,4,power_law_1.01,0.16361600160598755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,4,power_law_1.01,0.17489919662475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,4,power_law_1.2,0.16240639686584474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,4,power_law_1.2,0.17051520347595214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,8,balanced,0.08916800220807393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,8,balanced,0.0899733304977417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,8,power_law_1.01,0.14360320568084717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,8,power_law_1.01,0.15192960500717162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,8,power_law_1.2,0.144652795791626
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,1,8,power_law_1.2,0.1509119987487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,16,1,balanced,0.06650666892528534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,16,1,balanced,0.06665599842866261
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,16,1,power_law_1.01,0.06707839965820313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,16,1,power_law_1.01,0.06855679750442505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,16,1,power_law_1.2,0.06836479902267456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,16,1,power_law_1.2,0.06926720142364502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,2,1,balanced,0.1606826682885488
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,2,1,balanced,0.1646399994691213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,2,1,power_law_1.01,0.20327680110931395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,2,1,power_law_1.01,0.22140800952911377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,2,1,power_law_1.2,0.18908159732818602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,2,1,power_law_1.2,0.2029184103012085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,32,1,balanced,0.055871998270352684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,32,1,balanced,0.057760000228881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,32,1,power_law_1.01,0.058847999572753905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,32,1,power_law_1.01,0.06197119951248169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,32,1,power_law_1.2,0.05971840023994446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,32,1,power_law_1.2,0.06064640283584595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,4,1,balanced,0.11167466640472412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,4,1,balanced,0.11199999849001567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,4,1,power_law_1.01,0.1281599998474121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,4,1,power_law_1.01,0.13731199502944946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,4,1,power_law_1.2,0.1223680019378662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,4,1,power_law_1.2,0.13075200319290162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,8,1,balanced,0.08429867029190063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,8,1,balanced,0.08438400427500407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,8,1,power_law_1.01,0.08615679740905761
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,8,1,power_law_1.01,0.0887935996055603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,8,1,power_law_1.2,0.08766080141067505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,14336,2,8,8,1,power_law_1.2,0.0898751974105835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,1,balanced,0.3078933358192444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,1,balanced,0.308351993560791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,1,power_law_1.01,0.36338560581207274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,1,power_law_1.01,0.36791040897369387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,1,power_law_1.2,0.37695999145507814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,1,power_law_1.2,0.3809535980224609
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,128,balanced,0.05190933247407278
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,128,balanced,0.05197866757710775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,128,power_law_1.01,0.052313601970672606
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,128,power_law_1.01,0.05264639854431152
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,128,power_law_1.2,0.05300480127334595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,128,power_law_1.2,0.05479679703712463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,16,balanced,0.06913066903750102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,16,balanced,0.06980800131956737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,16,power_law_1.01,0.07500159740447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,16,power_law_1.01,0.07541120052337646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,16,power_law_1.2,0.07614719867706299
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,16,power_law_1.2,0.0779583990573883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,2,balanced,0.15934399763743082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,2,balanced,0.16049599647521973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,2,power_law_1.01,0.1880895972251892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,2,power_law_1.01,0.1901568055152893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,2,power_law_1.2,0.19601919651031494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,2,power_law_1.2,0.19838720560073853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,32,balanced,0.05414933462937673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,32,balanced,0.0552106648683548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,32,power_law_1.01,0.0610368013381958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,32,power_law_1.01,0.06288639903068542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,32,power_law_1.2,0.06218879818916321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,32,power_law_1.2,0.06347519755363465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,4,balanced,0.129530668258667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,4,balanced,0.13109866778055826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,4,power_law_1.01,0.1264575958251953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,4,power_law_1.01,0.13151999711990356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,4,power_law_1.2,0.1305408000946045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,4,power_law_1.2,0.13752319812774658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,64,balanced,0.05172266562779745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,64,balanced,0.052101333936055504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,64,power_law_1.01,0.053548800945281985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,64,power_law_1.01,0.0542464017868042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,64,power_law_1.2,0.05930240154266357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,64,power_law_1.2,0.0599232017993927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,8,balanced,0.08398399750391643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,8,balanced,0.08565333485603333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,8,power_law_1.01,0.08895360231399536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,8,power_law_1.01,0.0915391981601715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,8,power_law_1.2,0.09329280257225037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,1,8,power_law_1.2,0.09470080137252808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,2,1,balanced,0.19342933098475137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,2,1,balanced,0.19358932971954346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,2,1,power_law_1.01,0.22298240661621094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,2,1,power_law_1.01,0.22557439804077148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,2,1,power_law_1.2,0.23086719512939452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,2,1,power_law_1.2,0.23104639053344728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,4,1,balanced,0.1393119990825653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,4,1,balanced,0.1397706667582194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,4,1,power_law_1.01,0.15385600328445434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,4,1,power_law_1.01,0.1542847990989685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,4,1,power_law_1.2,0.15605119466781617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,4,1,power_law_1.2,0.15873279571533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,8,1,balanced,0.11458133657773335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,8,1,balanced,0.1153546671072642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,8,1,power_law_1.01,0.12109440565109253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,8,1,power_law_1.01,0.12129919528961182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,8,1,power_law_1.2,0.12055039405822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,4096,1536,8,128,8,1,power_law_1.2,0.12246400117874146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,1,balanced,0.4601759910583496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,1,balanced,0.46133331457773846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,1,power_law_1.01,0.5701439857482911
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,1,power_law_1.01,0.5890495777130127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,1,power_law_1.2,0.597273588180542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,1,power_law_1.2,0.632806396484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,2,balanced,0.25117866198221844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,2,balanced,0.25274133682250977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,2,power_law_1.01,0.4162623882293701
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,2,power_law_1.01,0.4324480056762695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,2,power_law_1.2,0.3694400072097778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,2,power_law_1.2,0.3843775987625122
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,4,balanced,0.16107199589411417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,4,balanced,0.16167466839154562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,4,power_law_1.01,0.27384960651397705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,4,power_law_1.01,0.2880703926086426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,4,power_law_1.2,0.258790397644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,4,power_law_1.2,0.26652801036834717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,8,balanced,0.11030399799346924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,8,balanced,0.11269866426785786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,8,power_law_1.01,0.2155071973800659
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,8,power_law_1.01,0.22004480361938478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,8,power_law_1.2,0.21767680644989013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,1,8,power_law_1.2,0.22904961109161376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,16,1,balanced,0.08476266264915466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,16,1,balanced,0.08490133285522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,16,1,power_law_1.01,0.09278720021247863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,16,1,power_law_1.01,0.09890559911727906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,16,1,power_law_1.2,0.09106559753417968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,16,1,power_law_1.2,0.09296000003814697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,2,1,balanced,0.23118933041890463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,2,1,balanced,0.23403199513753256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,2,1,power_law_1.01,0.3253376007080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,2,1,power_law_1.01,0.32666239738464353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,2,1,power_law_1.2,0.315993595123291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,2,1,power_law_1.2,0.3197695970535278
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,32,1,balanced,0.0745600014925003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,32,1,balanced,0.07457066575686137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,32,1,power_law_1.01,0.07857279777526856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,32,1,power_law_1.01,0.08011519908905029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,32,1,power_law_1.2,0.07798399925231933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,32,1,power_law_1.2,0.07953919768333435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,4,1,balanced,0.1474613348642985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,4,1,balanced,0.14800000190734863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,4,1,power_law_1.01,0.1794368028640747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,4,1,power_law_1.01,0.1904703974723816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,4,1,power_law_1.2,0.1704576015472412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,4,1,power_law_1.2,0.17363840341567993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,8,1,balanced,0.10896000266075134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,8,1,balanced,0.11020800471305847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,8,1,power_law_1.01,0.12001279592514039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,8,1,power_law_1.01,0.12336640357971192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,8,1,power_law_1.2,0.11727360486984253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,16384,2,8,8,1,power_law_1.2,0.12825599908828736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,1,balanced,0.9404693444569906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,1,balanced,0.9456160068511963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,1,power_law_1.01,1.127295970916748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,1,power_law_1.01,1.1343551635742188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,1,power_law_1.2,1.1907072067260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,1,power_law_1.2,1.1997568130493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,128,balanced,0.06198399762312571
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,128,balanced,0.06270933151245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,128,power_law_1.01,0.06636800169944763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,128,power_law_1.01,0.06816639900207519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,128,power_law_1.2,0.06884480118751526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,128,power_law_1.2,0.07331200242042542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,16,balanced,0.1267093320687612
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,16,balanced,0.12820266683896384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,16,power_law_1.01,0.12547839879989625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,16,power_law_1.01,0.1267840027809143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,16,power_law_1.2,0.12891520261764527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,16,power_law_1.2,0.130348801612854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,2,balanced,0.45371198654174805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,2,balanced,0.4549599885940552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,2,power_law_1.01,0.5089471817016602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,2,power_law_1.01,0.5186495780944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,2,power_law_1.2,0.5316415786743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,2,power_law_1.2,0.5356287956237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,256,balanced,0.0603413333495458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,256,balanced,0.060421332716941833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,256,power_law_1.01,0.060140800476074216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,256,power_law_1.01,0.06080639958381653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,256,power_law_1.2,0.061440002918243405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,256,power_law_1.2,0.06440320014953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,32,balanced,0.0929813285668691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,32,balanced,0.09435199697812398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,32,power_law_1.01,0.09737600088119507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,32,power_law_1.01,0.09802240133285522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,32,power_law_1.2,0.0980351984500885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,32,power_law_1.2,0.10321919918060303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,4,balanced,0.2677173415819804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,4,balanced,0.272213339805603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,4,power_law_1.01,0.27394559383392336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,4,power_law_1.01,0.27526400089263914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,4,power_law_1.2,0.28331520557403567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,4,power_law_1.2,0.29263360500335694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,64,balanced,0.07700266440709432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,64,balanced,0.07916800181070964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,64,power_law_1.01,0.08058879971504211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,64,power_law_1.01,0.08075519800186157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,64,power_law_1.2,0.08478080034255982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,64,power_law_1.2,0.08529919981956482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,8,balanced,0.22482667366663614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,8,balanced,0.2473599910736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,8,power_law_1.01,0.1816704034805298
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,8,power_law_1.01,0.19162240028381347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,8,power_law_1.2,0.2066431999206543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,1,8,power_law_1.2,0.23452160358428956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,16,1,balanced,0.19193067153294882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,16,1,balanced,0.1926400065422058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,16,1,power_law_1.01,0.20807039737701416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,16,1,power_law_1.01,0.2099839925765991
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,16,1,power_law_1.2,0.21479039192199706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,16,1,power_law_1.2,0.21544320583343507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,2,1,balanced,0.5131413141886393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,2,1,balanced,0.513322671254476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,2,1,power_law_1.01,0.5906047821044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,2,1,power_law_1.01,0.596070384979248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,2,1,power_law_1.2,0.613702392578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,2,1,power_law_1.2,0.6240767955780029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,32,1,balanced,0.17528533935546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,32,1,balanced,0.1766773263613383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,32,1,power_law_1.01,0.19155839681625367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,32,1,power_law_1.01,0.1917248010635376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,32,1,power_law_1.2,0.19315199851989745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,32,1,power_law_1.2,0.19471360445022584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,4,1,balanced,0.31831467151641846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,4,1,balanced,0.31989866495132446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,4,1,power_law_1.01,0.3523583889007568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,4,1,power_law_1.01,0.3550976037979126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,4,1,power_law_1.2,0.3675328016281128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,4,1,power_law_1.2,0.36792960166931155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,8,1,balanced,0.22779200474421182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,8,1,balanced,0.22991466522216797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,8,1,power_law_1.01,0.24895360469818115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,8,1,power_law_1.01,0.2526911973953247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,8,1,power_law_1.2,0.2590399980545044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2048,8,256,8,1,power_law_1.2,0.259168004989624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,1,balanced,0.8126186529795328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,1,balanced,0.8208533128102621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,1,power_law_1.01,0.9091327667236329
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,1,power_law_1.01,0.9208512306213379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,1,power_law_1.2,0.9503744125366211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,1,power_law_1.2,0.950438404083252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,16,balanced,0.10883200168609619
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,16,balanced,0.1095413366953532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,16,power_law_1.01,0.11954560279846191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,16,power_law_1.01,0.12316160202026367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,16,power_law_1.2,0.12391040325164795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,16,power_law_1.2,0.12420480251312256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,2,balanced,0.3821226755777995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,2,balanced,0.38365864753723145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,2,power_law_1.01,0.4450496196746826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,2,power_law_1.01,0.4567232131958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,2,power_law_1.2,0.4674560070037842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,2,power_law_1.2,0.47064957618713377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,32,balanced,0.08745599786440532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,32,balanced,0.0899679958820343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,32,power_law_1.01,0.09490560293197632
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,32,power_law_1.01,0.0956928014755249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,32,power_law_1.2,0.09807999730110169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,32,power_law_1.2,0.10138239860534667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,4,balanced,0.36826133728027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,4,balanced,0.375274658203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,4,power_law_1.01,0.2803967952728271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,4,power_law_1.01,0.3145983934402466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,4,power_law_1.2,0.3131903886795044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,4,power_law_1.2,0.3287872076034546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,8,balanced,0.15577066938082376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,8,balanced,0.1566933294137319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,8,power_law_1.01,0.17006080150604247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,8,power_law_1.01,0.17582080364227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,8,power_law_1.2,0.1780608057975769
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,1,8,power_law_1.2,0.18029439449310303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,2,1,balanced,0.46320533752441406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,2,1,balanced,0.4642346700032552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,2,1,power_law_1.01,0.5103295803070068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,2,1,power_law_1.01,0.5104767799377441
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,2,1,power_law_1.2,0.5260543823242188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,2,1,power_law_1.2,0.5290624141693115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,4,1,balanced,0.29129600524902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,4,1,balanced,0.291866660118103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,4,1,power_law_1.01,0.31278719902038576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,4,1,power_law_1.01,0.31918718814849856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,4,1,power_law_1.2,0.3227008104324341
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,4,1,power_law_1.2,0.32332799434661863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,8,1,balanced,0.20154666900634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,8,1,balanced,0.2018666664759318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,8,1,power_law_1.01,0.2098560094833374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,8,1,power_law_1.01,0.2119488000869751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,8,1,power_law_1.2,0.2157952070236206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,6144,2560,8,160,8,1,power_law_1.2,0.2169663906097412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,1,balanced,1.100549300511678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,1,balanced,1.114847977956136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,1,power_law_1.01,1.3073344230651855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,1,power_law_1.01,1.3316032409667968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,1,power_law_1.2,1.3823488235473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,1,power_law_1.2,1.387769603729248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,128,balanced,0.07070399820804596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,128,balanced,0.07121600210666656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,128,power_law_1.01,0.07367680072784424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,128,power_law_1.01,0.0741823971271515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,128,power_law_1.2,0.07654399871826172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,128,power_law_1.2,0.08076159954071045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,16,balanced,0.1365333298842112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,16,balanced,0.1383680005868276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,16,power_law_1.01,0.13793280124664306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,16,power_law_1.01,0.14168319702148438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,16,power_law_1.2,0.14240000247955323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,16,power_law_1.2,0.14595839977264405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,2,balanced,0.5263253450393677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,2,balanced,0.5270346800486246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,2,power_law_1.01,0.5916160106658935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,2,power_law_1.01,0.6086463928222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,2,power_law_1.2,0.6153471946716309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,2,power_law_1.2,0.6285312175750732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,256,balanced,0.06568533182144165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,256,balanced,0.06638399759928386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,256,power_law_1.01,0.06595199704170226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,256,power_law_1.01,0.06621440052986145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,256,power_law_1.2,0.06997759938240052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,256,power_law_1.2,0.07025279998779296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,32,balanced,0.10713066657384236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,32,balanced,0.11000000437100728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,32,power_law_1.01,0.1067199945449829
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,32,power_law_1.01,0.10750720500946045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,32,power_law_1.2,0.11157759428024291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,32,power_law_1.2,0.11179519891738891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,4,balanced,0.30792532364527386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,4,balanced,0.3094133337338765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,4,power_law_1.01,0.3182143926620483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,4,power_law_1.01,0.3203392028808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,4,power_law_1.2,0.3425856113433838
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,4,power_law_1.2,0.34676480293273926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,64,balanced,0.08683733145395915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,64,balanced,0.08815466364224751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,64,power_law_1.01,0.08965759873390197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,64,power_law_1.01,0.09165440201759338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,64,power_law_1.2,0.09170560240745544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,64,power_law_1.2,0.09317759871482849
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,8,balanced,0.2469546596209208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,8,balanced,0.2739253242810567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,8,power_law_1.01,0.2271104097366333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,8,power_law_1.01,0.23900799751281737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,8,power_law_1.2,0.2511104106903076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,1,8,power_law_1.2,0.2521536111831665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,16,1,balanced,0.21837866306304932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,16,1,balanced,0.21853333711624146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,16,1,power_law_1.01,0.23931519985198973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,16,1,power_law_1.01,0.23957760334014894
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,16,1,power_law_1.2,0.24404480457305908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,16,1,power_law_1.2,0.24636800289154054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,2,1,balanced,0.5966933170954386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,2,1,balanced,0.5987840096155802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,2,1,power_law_1.01,0.6906239986419678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,2,1,power_law_1.01,0.6928575992584228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,2,1,power_law_1.2,0.7214528083801269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,2,1,power_law_1.2,0.727027177810669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,32,1,balanced,0.20016000668207803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,32,1,balanced,0.20098666350046793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,32,1,power_law_1.01,0.2179647922515869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,32,1,power_law_1.01,0.2180095911026001
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,32,1,power_law_1.2,0.22069120407104492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,32,1,power_law_1.2,0.22222719192504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,4,1,balanced,0.3681600093841553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,4,1,balanced,0.3690026601155599
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,4,1,power_law_1.01,0.41011199951171873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,4,1,power_law_1.01,0.4111167907714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,4,1,power_law_1.2,0.42622718811035154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,4,1,power_law_1.2,0.43079681396484376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,8,1,balanced,0.2617866595586141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,8,1,balanced,0.2618773380915324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,8,1,power_law_1.01,0.2892672061920166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,8,1,power_law_1.01,0.2896640062332153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,8,1,power_law_1.2,0.2953216075897217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,256,8,1,power_law_1.2,0.29738240242004393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,1,balanced,1.5899786949157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,1,balanced,1.7343254089355469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,1,power_law_1.01,1.5385279655456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,1,power_law_1.01,1.5504639625549317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,1,power_law_1.2,1.6225408554077148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,1,power_law_1.2,1.6237503051757813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,128,balanced,0.07863466441631317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,128,balanced,0.07922133306662242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,128,power_law_1.01,0.07964800000190735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,128,power_law_1.01,0.08177279829978942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,128,power_law_1.2,0.08362240195274354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,128,power_law_1.2,0.0840511977672577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,16,balanced,0.17631999651590982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,16,balanced,0.1831093430519104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,16,power_law_1.01,0.16398080587387084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,16,power_law_1.01,0.1694208025932312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,16,power_law_1.2,0.16572799682617187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,16,power_law_1.2,0.17422720193862914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,2,balanced,0.7472693125406901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,2,balanced,0.7483786741892496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,2,power_law_1.01,0.704857587814331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,2,power_law_1.01,0.7411136150360107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,2,power_law_1.2,0.7433407783508301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,2,power_law_1.2,0.7544703960418702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,32,balanced,0.12184533476829529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,32,balanced,0.1227946678797404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,32,power_law_1.01,0.11850880384445191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,32,power_law_1.01,0.12233599424362182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,32,power_law_1.2,0.12197120189666748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,32,power_law_1.2,0.12503679990768432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,4,balanced,0.4776159922281901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,4,balanced,0.4790079991022746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,4,power_law_1.01,0.4023295879364014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,4,power_law_1.01,0.41385598182678224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,4,power_law_1.2,0.41527681350708007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,4,power_law_1.2,0.42539520263671876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,64,balanced,0.09878933429718018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,64,balanced,0.09929066896438599
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,64,power_law_1.01,0.09462400078773499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,64,power_law_1.01,0.0964735984802246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,64,power_law_1.2,0.09748479723930359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,64,power_law_1.2,0.09887359738349914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,8,balanced,0.5625120004018148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,8,balanced,0.5801173448562622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,8,power_law_1.01,0.35634560585021974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,8,power_law_1.01,0.36186239719390867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,8,power_law_1.2,0.3789439916610718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,1,8,power_law_1.2,0.3896512031555176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,16,1,balanced,0.2786986629168193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,16,1,balanced,0.28062933683395386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,16,1,power_law_1.01,0.26421759128570554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,16,1,power_law_1.01,0.2665343999862671
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,16,1,power_law_1.2,0.2724479913711548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,16,1,power_law_1.2,0.273523211479187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,2,1,balanced,0.8435946305592855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,2,1,balanced,0.8468586603800455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,2,1,power_law_1.01,0.8188480377197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,2,1,power_law_1.01,0.8220095634460449
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,2,1,power_law_1.2,0.8447296142578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,2,1,power_law_1.2,0.8511296272277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,32,1,balanced,0.24995734294255575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,32,1,balanced,0.2505439917246501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,32,1,power_law_1.01,0.23597440719604493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,32,1,power_law_1.01,0.23627519607543945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,32,1,power_law_1.2,0.2389120101928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,32,1,power_law_1.2,0.24196479320526124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,4,1,balanced,0.5007253487904867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,4,1,balanced,0.5014239947001139
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,4,1,power_law_1.01,0.46996479034423827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,4,1,power_law_1.01,0.47436161041259767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,4,1,power_law_1.2,0.48855037689208985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,4,1,power_law_1.2,0.4905983924865723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,8,1,balanced,0.3401120106379191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,8,1,balanced,0.3429493506749471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,8,1,power_law_1.01,0.3212863922119141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,8,1,power_law_1.01,0.3239936113357544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,8,1,power_law_1.2,0.32982399463653567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1024,7168,2048,8,384,8,1,power_law_1.2,0.3327807903289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,1,balanced,0.6249386469523112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,1,balanced,0.6324853499730428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,1,power_law_1.01,0.6692800045013427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,1,power_law_1.01,0.6797567844390869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,1,power_law_1.2,0.6792191982269287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,1,power_law_1.2,0.679532814025879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,128,balanced,0.15063466628392538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,128,balanced,0.1506613294283549
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,128,power_law_1.01,0.17553919553756714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,128,power_law_1.01,0.17867519855499267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,128,power_law_1.2,0.20315520763397216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,128,power_law_1.2,0.20453760623931885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,16,balanced,0.17467200756072998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,16,balanced,0.1749653418858846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,16,power_law_1.01,0.21950719356536866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,16,power_law_1.01,0.22446079254150392
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,16,power_law_1.2,0.23840000629425048
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,16,power_law_1.2,0.24790399074554442
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,2,balanced,0.3828959862391154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,2,balanced,0.38365332285563153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,2,power_law_1.01,0.4262527942657471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,2,power_law_1.01,0.4422912120819092
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,2,power_law_1.2,0.438047981262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,2,power_law_1.2,0.45601282119750974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,32,balanced,0.15903466939926147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,32,balanced,0.16004799803098044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,32,power_law_1.01,0.20266880989074706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,32,power_law_1.01,0.2089087963104248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,32,power_law_1.2,0.21376640796661378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,32,power_law_1.2,0.2164223909378052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,4,balanced,0.26711465915044147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,4,balanced,0.2672586639722188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,4,power_law_1.01,0.3084800004959106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,4,power_law_1.01,0.3209151983261108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,4,power_law_1.2,0.3392640113830566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,4,power_law_1.2,0.3491519927978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,64,balanced,0.15241066614786783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,64,balanced,0.15318399667739868
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,64,power_law_1.01,0.18932479619979858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,64,power_law_1.01,0.18999680280685424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,64,power_law_1.2,0.19950079917907715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,64,power_law_1.2,0.20748798847198485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,8,balanced,0.20816532770792642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,8,balanced,0.2091360092163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,8,power_law_1.01,0.24909439086914062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,8,power_law_1.01,0.2604543924331665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,8,power_law_1.2,0.2589375972747803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,1,8,power_law_1.2,0.27841920852661134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,2,1,balanced,0.4621973435084025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,2,1,balanced,0.4639626741409302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,2,1,power_law_1.01,0.48156161308288575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,2,1,power_law_1.01,0.4836480140686035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,2,1,power_law_1.2,0.4849984169006348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,2,1,power_law_1.2,0.48786559104919436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,4,1,balanced,0.3981279929478963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,4,1,balanced,0.40170665582021076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,4,1,power_law_1.01,0.4138688087463379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,4,1,power_law_1.01,0.4150207996368408
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,4,1,power_law_1.2,0.41449599266052245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,2048,768,8,128,4,1,power_law_1.2,0.41785597801208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,1,balanced,1.182421366373698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,1,balanced,1.1952106952667236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,1,power_law_1.01,1.3674240112304688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,1,power_law_1.01,1.3727999687194825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,1,power_law_1.2,1.3905535697937013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,1,power_law_1.2,1.3942015647888184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,128,balanced,0.21278399229049683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,128,balanced,0.21404266357421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,128,power_law_1.01,0.24680960178375244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,128,power_law_1.01,0.25576961040496826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,128,power_law_1.2,0.2778048038482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,128,power_law_1.2,0.2877952098846436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,16,balanced,0.26501866181691486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,16,balanced,0.26524800062179565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,16,power_law_1.01,0.3312191963195801
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,16,power_law_1.01,0.337446403503418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,16,power_law_1.2,0.35107200145721434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,16,power_law_1.2,0.3692352056503296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,2,balanced,0.6770453453063965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,2,balanced,0.6793493429819742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,2,power_law_1.01,0.7946815967559815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,2,power_law_1.01,0.8238143920898438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,2,power_law_1.2,0.8400064468383789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,2,power_law_1.2,0.9425344467163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,256,balanced,0.21163199345270792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,256,balanced,0.21188799540201822
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,256,power_law_1.01,0.23548800945281984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,256,power_law_1.01,0.23827199935913085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,256,power_law_1.2,0.2636607885360718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,256,power_law_1.2,0.2763200044631958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,32,balanced,0.23298132419586182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,32,balanced,0.23431466023127237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,32,power_law_1.01,0.2841536045074463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,32,power_law_1.01,0.2863615989685059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,32,power_law_1.2,0.3180927991867065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,32,power_law_1.2,0.32250878810882566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,4,balanced,0.4445066849390666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,4,balanced,0.44512001673380536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,4,power_law_1.01,0.5499328136444092
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,4,power_law_1.01,0.5610432147979736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,4,power_law_1.2,0.5759679794311523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,4,power_law_1.2,0.582316780090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,64,balanced,0.21799467007319132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,64,balanced,0.21860800186793009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,64,power_law_1.01,0.2580928087234497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,64,power_law_1.01,0.2660799980163574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,64,power_law_1.2,0.2923264026641846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,64,power_law_1.2,0.2936896085739136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,8,balanced,0.3267359932263692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,8,balanced,0.3272213339805603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,8,power_law_1.01,0.3919680118560791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,8,power_law_1.01,0.4144447803497314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,8,power_law_1.2,0.43432960510253904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,1,8,power_law_1.2,0.45160961151123047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,2,1,balanced,0.7565013567606608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,2,1,balanced,0.7598293622334799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,2,1,power_law_1.01,0.8640192031860352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,2,1,power_law_1.01,0.8663935661315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,2,1,power_law_1.2,0.8771455764770508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,2,1,power_law_1.2,0.8821887969970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,4,1,balanced,0.5724853277206421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,4,1,balanced,0.573797345161438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,4,1,power_law_1.01,0.6427519798278809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,4,1,power_law_1.01,0.6469632148742676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,4,1,power_law_1.2,0.6537600040435791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,4,1,power_law_1.2,0.6545983791351319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,8,1,balanced,0.5097226699193319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,8,1,balanced,0.5102719863255819
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,8,1,power_law_1.01,0.5603583812713623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,8,1,power_law_1.01,0.5615871906280517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,8,1,power_law_1.2,0.5682432174682617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,3072,1536,8,256,8,1,power_law_1.2,0.570246410369873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,1,balanced,2.497978687286377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,1,balanced,2.581914742787679
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,1,power_law_1.01,2.5321088790893556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,1,power_law_1.01,2.537894439697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,1,power_law_1.2,2.538483238220215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,1,power_law_1.2,2.543436813354492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,2,balanced,1.3237280050913494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,2,balanced,1.3480213483174641
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,2,power_law_1.01,1.6908031463623048
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,2,power_law_1.01,1.9814016342163085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,2,power_law_1.2,1.8679935455322265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,2,power_law_1.2,1.869081687927246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,4,balanced,0.7828693389892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,4,balanced,0.7841386795043945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,4,power_law_1.01,1.4116928100585937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,4,power_law_1.01,1.7762239456176758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,4,power_law_1.2,1.4464447975158692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,4,power_law_1.2,1.4688063621520997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,8,balanced,0.5121119817097982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,8,balanced,0.5127413272857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,8,power_law_1.01,1.2536767959594726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,8,power_law_1.01,1.2744640350341796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,8,power_law_1.2,1.1832575798034668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,1,8,power_law_1.2,1.24902400970459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,16,1,balanced,0.4224693377812703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,16,1,balanced,0.423306663831075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,16,1,power_law_1.01,0.42225279808044436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,16,1,power_law_1.01,0.4240128040313721
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,16,1,power_law_1.2,0.42278399467468264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,16,1,power_law_1.2,0.4233664035797119
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,2,1,balanced,1.3338665962219238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,2,1,balanced,1.333957354227702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,2,1,power_law_1.01,1.361894416809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,2,1,power_law_1.01,1.3673600196838378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,2,1,power_law_1.2,1.367347240447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,2,1,power_law_1.2,1.3742976188659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,32,1,balanced,0.36070934931437176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,32,1,balanced,0.3617173433303833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,32,1,power_law_1.01,0.3613375902175903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,32,1,power_law_1.01,0.36154239177703856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,32,1,power_law_1.2,0.3614784002304077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,32,1,power_law_1.2,0.36151039600372314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,4,1,balanced,0.8104106585184733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,4,1,balanced,0.8104906876881918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,4,1,power_law_1.01,0.8199616432189941
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,4,1,power_law_1.01,0.8231167793273926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,4,1,power_law_1.2,0.8270079612731933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,4,1,power_law_1.2,0.8276351928710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,8,1,balanced,0.5470986763636271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,8,1,balanced,0.5497119824091593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,8,1,power_law_1.01,0.5549759864807129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,8,1,power_law_1.01,0.5570559978485108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,8,1,power_law_1.2,0.5525184154510498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,14336,2,8,8,1,power_law_1.2,0.5556928157806397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,1,balanced,1.4067519505818684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,1,balanced,1.4111253420511882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,1,power_law_1.01,1.4983424186706542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,1,power_law_1.01,1.5076224327087402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,1,power_law_1.2,1.500723171234131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,1,power_law_1.2,1.519647979736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,128,balanced,0.2615306576093038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,128,balanced,0.26203733682632446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,128,power_law_1.01,0.31902079582214354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,128,power_law_1.01,0.3302783966064453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,128,power_law_1.2,0.3782272100448608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,128,power_law_1.2,0.379423999786377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,16,balanced,0.31912533442179364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,16,balanced,0.31918932994206745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,16,power_law_1.01,0.41587200164794924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,16,power_law_1.01,0.4233407974243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,16,power_law_1.2,0.460646390914917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,16,power_law_1.2,0.4845439910888672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,2,balanced,0.7928000291188558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,2,balanced,0.7954613367716471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,2,power_law_1.01,0.9408512115478516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,2,power_law_1.01,0.9558143615722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,2,power_law_1.2,0.9397055625915527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,2,power_law_1.2,0.942790412902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,32,balanced,0.2852426568667094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,32,balanced,0.2853920062383016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,32,power_law_1.01,0.37156479358673095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,32,power_law_1.01,0.37292160987854006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,32,power_law_1.2,0.43208961486816405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,32,power_law_1.2,0.45429120063781736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,4,balanced,0.5232959985733032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,4,balanced,0.5235360066095988
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,4,power_law_1.01,0.6498623847961426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,4,power_law_1.01,0.6521535873413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,4,power_law_1.2,0.6650944232940674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,4,power_law_1.2,0.7001279830932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,64,balanced,0.2683680057525635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,64,balanced,0.2685760060946147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,64,power_law_1.01,0.34456961154937743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,64,power_law_1.01,0.34810240268707277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,64,power_law_1.2,0.3864255905151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,64,power_law_1.2,0.4160895824432373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,8,balanced,0.388805349667867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,8,balanced,0.38943998018900555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,8,power_law_1.01,0.5087935924530029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,8,power_law_1.01,0.5243199825286865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,8,power_law_1.2,0.5303167819976806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,1,8,power_law_1.2,0.5933568000793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,2,1,balanced,0.9200159708658854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,2,1,balanced,0.9253493150075277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,2,1,power_law_1.01,0.9747776031494141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,2,1,power_law_1.01,0.97958402633667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,2,1,power_law_1.2,0.9777407646179199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,2,1,power_law_1.2,0.9806655883789063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,4,1,balanced,0.714799960454305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,4,1,balanced,0.718010663986206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,4,1,power_law_1.01,0.749235200881958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,4,1,power_law_1.01,0.7500607967376709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,4,1,power_law_1.2,0.7471039772033692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,4,1,power_law_1.2,0.7619135856628418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,8,1,balanced,0.6400800148646036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,8,1,balanced,0.6428159872690836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,8,1,power_law_1.01,0.6575232028961182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,8,1,power_law_1.01,0.6636352062225341
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,8,1,power_law_1.2,0.6661759853363037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,4096,1536,8,128,8,1,power_law_1.2,0.679148817062378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,1,balanced,5.763354619344075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,1,balanced,6.2502396901448565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,1,power_law_1.01,4.94213752746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,1,power_law_1.01,4.99447021484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,1,power_law_1.2,4.933542251586914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,1,power_law_1.2,5.111033630371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,2,balanced,2.5972746213277182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,2,balanced,2.597930590311686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,2,power_law_1.01,3.346451187133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,2,power_law_1.01,4.1661121368408205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,2,power_law_1.2,3.644339370727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,2,power_law_1.2,3.73939208984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,4,balanced,1.4087732632954915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,4,balanced,1.426165262858073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,4,power_law_1.01,3.021062469482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,4,power_law_1.01,3.315379333496094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,4,power_law_1.2,2.848908805847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,4,power_law_1.2,2.8837440490722654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,8,balanced,0.8194293181101481
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,8,balanced,0.8353652954101562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,8,power_law_1.01,2.3679935455322267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,8,power_law_1.01,2.4477888107299806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,8,power_law_1.2,2.4795839309692385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,1,8,power_law_1.2,2.5533824920654298
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,16,1,balanced,0.601797342300415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,16,1,balanced,0.602949341138204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,16,1,power_law_1.01,0.60731520652771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,16,1,power_law_1.01,0.6082304000854493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,16,1,power_law_1.2,0.6051519870758056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,16,1,power_law_1.2,0.6089344024658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,2,1,balanced,2.20523738861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,2,1,balanced,2.2563625971476235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,2,1,power_law_1.01,2.1923200607299806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,2,1,power_law_1.01,2.211359977722168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,2,1,power_law_1.2,2.183225631713867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,2,1,power_law_1.2,2.18988151550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,32,1,balanced,0.5023466746012369
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,32,1,balanced,0.5036960045496622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,32,1,power_law_1.01,0.5048511981964111
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,32,1,power_law_1.01,0.5068031787872315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,32,1,power_law_1.2,0.5040128231048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,32,1,power_law_1.2,0.5045567989349365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,4,1,balanced,1.2561546961466472
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,4,1,balanced,1.2606613636016846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,4,1,power_law_1.01,1.2726143836975097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,4,1,power_law_1.01,1.2828351974487304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,4,1,power_law_1.2,1.2820223808288573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,4,1,power_law_1.2,1.2831487655639648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,8,1,balanced,0.8268000284830729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,8,1,balanced,0.8272639910380045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,8,1,power_law_1.01,0.8325440406799316
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,8,1,power_law_1.01,0.8349247932434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,8,1,power_law_1.2,0.8303296089172363
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,16384,2,8,8,1,power_law_1.2,0.8317184448242188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,1,balanced,2.7327518463134766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,1,balanced,2.7624053955078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,1,power_law_1.01,3.0344703674316404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,1,power_law_1.01,3.0838911056518556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,1,power_law_1.2,3.151411247253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,1,power_law_1.2,3.1829952239990233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,128,balanced,0.36927998065948486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,128,balanced,0.36977601051330566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,128,power_law_1.01,0.4373760223388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,128,power_law_1.01,0.44786558151245115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,128,power_law_1.2,0.5018176078796387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,128,power_law_1.2,0.510099220275879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,16,balanced,0.48210132122039795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,16,balanced,0.48292267322540283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,16,power_law_1.01,0.6121151924133301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,16,power_law_1.01,0.6246016025543213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,16,power_law_1.2,0.6935423851013184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,16,power_law_1.2,0.7043263912200928
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,2,balanced,1.4709280331929524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,2,balanced,1.474671999613444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,2,power_law_1.01,1.7861440658569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,2,power_law_1.01,1.7947263717651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,2,power_law_1.2,1.8571392059326173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,2,power_law_1.2,1.9220224380493165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,256,balanced,0.3606133460998535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,256,balanced,0.3614773352940877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,256,power_law_1.01,0.41924481391906737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,256,power_law_1.01,0.4231743812561035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,256,power_law_1.2,0.5071743965148926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,256,power_law_1.2,0.5187967777252197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,32,balanced,0.42023468017578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,32,balanced,0.4206240177154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,32,power_law_1.01,0.5296000003814697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,32,power_law_1.01,0.5368768215179444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,32,power_law_1.2,0.6300543785095215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,32,power_law_1.2,0.6383615970611572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,4,balanced,0.8877653280893961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,4,balanced,0.8899626731872559
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,4,power_law_1.01,1.1037887573242187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,4,power_law_1.01,1.1225343704223634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,4,power_law_1.2,1.1658944129943847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,4,power_law_1.2,1.2881216049194335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,64,balanced,0.381658673286438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,64,balanced,0.3826719919840495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,64,power_law_1.01,0.4806272029876709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,64,power_law_1.01,0.4849535942077637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,64,power_law_1.2,0.5525119781494141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,64,power_law_1.2,0.5628992080688476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,8,balanced,0.6118826468785604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,8,balanced,0.6135146617889404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,8,power_law_1.01,0.8012672424316406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,8,power_law_1.01,0.827724838256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,8,power_law_1.2,0.8873279571533204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,1,8,power_law_1.2,0.8944255828857421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,16,1,balanced,0.8094186782836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,16,1,balanced,0.809770663579305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,16,1,power_law_1.01,0.8638655662536621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,16,1,power_law_1.01,0.8687616348266601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,16,1,power_law_1.2,0.8779775619506835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,16,1,power_law_1.2,0.8876480102539063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,2,1,balanced,1.5998133023579915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,2,1,balanced,1.6034560203552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,2,1,power_law_1.01,1.8330303192138673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,2,1,power_law_1.01,1.8547391891479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,2,1,power_law_1.2,1.864908790588379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,2,1,power_law_1.2,1.8720703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,32,1,balanced,0.8286080360412598
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,32,1,balanced,0.8290293216705322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,32,1,power_law_1.01,0.8842495918273926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,32,1,power_law_1.01,0.8872960090637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,32,1,power_law_1.2,0.896121597290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,32,1,power_law_1.2,0.9086463928222657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,4,1,balanced,1.1168533166249592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,4,1,balanced,1.121776024500529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,4,1,power_law_1.01,1.2377920150756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,4,1,power_law_1.01,1.2410176277160645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,4,1,power_law_1.2,1.2691264152526855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,4,1,power_law_1.2,1.278003215789795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,8,1,balanced,0.8959360122680664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,8,1,balanced,0.8970773220062256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,8,1,power_law_1.01,0.9751744270324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,8,1,power_law_1.01,0.9760512351989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,8,1,power_law_1.2,0.9872703552246094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2048,8,256,8,1,power_law_1.2,1.006822395324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,1,balanced,3.138352076212565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,1,balanced,3.1551198959350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,1,power_law_1.01,3.3631359100341798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,1,power_law_1.01,3.4047550201416015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,1,power_law_1.2,3.3790592193603515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,1,power_law_1.2,3.5004928588867186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,16,balanced,0.5116480191548666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,16,balanced,0.5120160182317098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,16,power_law_1.01,0.717625617980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,16,power_law_1.01,0.7338751792907715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,16,power_law_1.2,0.8229375839233398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,16,power_law_1.2,0.8246912002563477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,2,balanced,1.702986717224121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,2,balanced,1.704250653584798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,2,power_law_1.01,1.9745088577270509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,2,power_law_1.01,2.073139190673828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,2,power_law_1.2,1.9053184509277343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,2,power_law_1.2,1.9190271377563477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,32,balanced,0.4316106637318929
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,32,balanced,0.4329386552174886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,32,power_law_1.01,0.5969024181365967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,32,power_law_1.01,0.6406015872955322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,32,power_law_1.2,0.6958079814910889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,32,power_law_1.2,0.7086592197418213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,4,balanced,0.9985333283742269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,4,balanced,1.0064586798350017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,4,power_law_1.01,1.287820816040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,4,power_law_1.01,1.3558015823364258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,4,power_law_1.2,1.2839872360229492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,4,power_law_1.2,1.4040575981140138
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,8,balanced,0.6748639742533366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,8,balanced,0.6760906378428141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,8,power_law_1.01,0.8836223602294921
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,8,power_law_1.01,0.9381888389587403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,8,power_law_1.2,0.9674943923950196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,1,8,power_law_1.2,1.0282048225402831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,2,1,balanced,1.8524266878763835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,2,1,balanced,1.856346607208252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,2,1,power_law_1.01,2.000454330444336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,2,1,power_law_1.01,2.0131263732910156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,2,1,power_law_1.2,1.9963392257690429
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,2,1,power_law_1.2,2.003001594543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,4,1,balanced,1.2667146523793538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,4,1,balanced,1.2826720078786213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,4,1,power_law_1.01,1.3505087852478028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,4,1,power_law_1.01,1.3598848342895509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,4,1,power_law_1.2,1.361843204498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,4,1,power_law_1.2,1.3756863594055175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,8,1,balanced,1.0327359835306804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,8,1,balanced,1.0463893413543701
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,8,1,power_law_1.01,1.0841664314270019
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,8,1,power_law_1.01,1.0871871948242187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,8,1,power_law_1.2,1.0932160377502442
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,6144,2560,8,160,8,1,power_law_1.2,1.1151103973388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,1,balanced,3.076047897338867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,1,balanced,3.1431573232014975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,1,power_law_1.01,3.607603073120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,1,power_law_1.01,3.618726348876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,1,power_law_1.2,3.6506816864013674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,1,power_law_1.2,3.7370174407958983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,128,balanced,0.4230773448944092
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,128,balanced,0.42483198642730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,128,power_law_1.01,0.5059584140777588
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,128,power_law_1.01,0.5227968215942382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,128,power_law_1.2,0.5898943901062011
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,128,power_law_1.2,0.5971776008605957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,16,balanced,0.554197351137797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,16,balanced,0.5549173355102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,16,power_law_1.01,0.7006720066070556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,16,power_law_1.01,0.7038720130920411
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,16,power_law_1.2,0.7500224113464355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,16,power_law_1.2,0.7921088218688965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,2,balanced,1.6889813741048176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,2,balanced,1.7045119603474934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,2,power_law_1.01,2.0327680587768553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,2,power_law_1.01,2.0491199493408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,2,power_law_1.2,2.129964828491211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,2,power_law_1.2,2.288159942626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,256,balanced,0.41276800632476807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,256,power_law_1.01,0.48254079818725587
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,256,power_law_1.01,0.4941887855529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,256,power_law_1.2,0.580838394165039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,256,power_law_1.2,0.5916927814483642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,32,balanced,0.4817066589991252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,32,balanced,0.48265600204467773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,32,power_law_1.01,0.6227327823638916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,32,power_law_1.01,0.6254208087921143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,32,power_law_1.2,0.6819200038909912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,32,power_law_1.2,0.6945087909698486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,4,balanced,1.0231306552886963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,4,balanced,1.0289493401845295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,4,power_law_1.01,1.2588543891906738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,4,power_law_1.01,1.2709312438964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,4,power_law_1.2,1.447590446472168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,4,power_law_1.2,1.4621503829956055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,64,balanced,0.4405279954274495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,64,balanced,0.4406133492787679
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,64,power_law_1.01,0.5565311908721924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,64,power_law_1.01,0.5703167915344238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,64,power_law_1.2,0.6140543937683105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,64,power_law_1.2,0.6281343936920166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,8,balanced,0.7031146685282389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,8,balanced,0.7067253589630127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,8,power_law_1.01,0.8851967811584472
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,8,power_law_1.01,0.9090047836303711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,8,power_law_1.2,0.9804863929748535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,1,8,power_law_1.2,1.00065279006958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,16,1,balanced,0.9343146483103434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,16,1,balanced,0.936293363571167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,16,1,power_law_1.01,0.9905152320861816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,16,1,power_law_1.01,0.9976384162902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,16,1,power_law_1.2,1.0076352119445802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,16,1,power_law_1.2,1.0114432334899903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,2,1,balanced,1.8521386782328289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,2,1,balanced,1.8614667256673176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,2,1,power_law_1.01,2.1307647705078123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,2,1,power_law_1.01,2.166361618041992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,2,1,power_law_1.2,2.1755008697509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,2,1,power_law_1.2,2.1972543716430666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,32,1,balanced,0.957045316696167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,32,1,balanced,0.9583679835001627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,32,1,power_law_1.01,1.0241984367370605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,32,1,power_law_1.01,1.02542724609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,32,1,power_law_1.2,1.0357376098632813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,32,1,power_law_1.2,1.043462371826172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,4,1,balanced,1.2950987021128337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,4,1,balanced,1.3049386342366536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,4,1,power_law_1.01,1.4357376098632812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,4,1,power_law_1.01,1.4435327529907227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,4,1,power_law_1.2,1.4650943756103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,4,1,power_law_1.2,1.4777983665466308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,8,1,balanced,1.0407040119171143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,8,1,balanced,1.0408746401468914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,8,1,power_law_1.01,1.121286392211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,8,1,power_law_1.01,1.1283583641052246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,8,1,power_law_1.2,1.1424768447875977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,256,8,1,power_law_1.2,1.1547391891479493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,1,balanced,3.199632008870443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,1,balanced,3.3037281036376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,1,power_law_1.01,3.9076606750488283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,1,power_law_1.01,3.998099136352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,1,power_law_1.2,4.164486312866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,1,power_law_1.2,4.261344146728516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,128,balanced,0.4228373368581136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,128,balanced,0.42559464772542316
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,128,power_law_1.01,0.4977151870727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,128,power_law_1.01,0.503929615020752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,128,power_law_1.2,0.5535999774932862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,128,power_law_1.2,0.5688896179199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,16,balanced,0.56004265944163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,16,balanced,0.5612906614939371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,16,power_law_1.01,0.6978879928588867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,16,power_law_1.01,0.7147200107574463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,16,power_law_1.2,0.7747392177581787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,16,power_law_1.2,0.7826943874359131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,2,balanced,1.7909760475158691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,2,balanced,1.7918880780537922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,2,power_law_1.01,2.234841537475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,2,power_law_1.01,2.2378368377685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,2,power_law_1.2,2.327903938293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,2,power_law_1.2,2.404812812805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,32,balanced,0.4838080008824666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,32,balanced,0.484991987546285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,32,power_law_1.01,0.5919551849365234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,32,power_law_1.01,0.6036479949951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,32,power_law_1.2,0.6504191875457763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,32,power_law_1.2,0.6652544021606446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,4,balanced,1.0583786964416504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,4,balanced,1.0630933443705242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,4,power_law_1.01,1.35729923248291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,4,power_law_1.01,1.4124799728393556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,4,power_law_1.2,1.4331328392028808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,4,power_law_1.2,1.4692352294921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,64,balanced,0.4410880009333293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,64,balanced,0.44121599197387695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,64,power_law_1.01,0.5310783863067627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,64,power_law_1.01,0.5359039783477784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,64,power_law_1.2,0.5926208019256591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,64,power_law_1.2,0.6002943992614747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,8,balanced,0.723632017771403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,8,balanced,0.7243039608001709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,8,power_law_1.01,0.9351424217224121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,8,power_law_1.01,0.9705535888671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,8,power_law_1.2,1.024665641784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,1,8,power_law_1.2,1.0798720359802245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,16,1,balanced,0.949023962020874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,16,1,balanced,0.949951966603597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,16,1,power_law_1.01,1.025657558441162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,16,1,power_law_1.01,1.0276224136352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,16,1,power_law_1.2,1.047225570678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,16,1,power_law_1.2,1.0516863822937013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,2,1,balanced,1.9452800750732422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,2,1,balanced,1.9781333605448406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,2,1,power_law_1.01,2.2882047653198243
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,2,1,power_law_1.01,2.289625549316406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,2,1,power_law_1.2,2.3493440628051756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,2,1,power_law_1.2,2.405504035949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,32,1,balanced,0.9615893363952637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,32,1,balanced,0.962778647740682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,32,1,power_law_1.01,1.0513600349426269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,32,1,power_law_1.01,1.0613375663757325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,32,1,power_law_1.2,1.0651328086853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,32,1,power_law_1.2,1.0766719818115233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,4,1,balanced,1.3347412745157878
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,4,1,balanced,1.3391200701395671
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,4,1,power_law_1.01,1.5200063705444335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,4,1,power_law_1.01,1.52871675491333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,4,1,power_law_1.2,1.576313591003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,4,1,power_law_1.2,1.5763327598571777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,8,1,balanced,1.0593760013580322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,8,1,balanced,1.061077356338501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,8,1,power_law_1.01,1.174937629699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,8,1,power_law_1.01,1.1769087791442872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,8,1,power_law_1.2,1.1988224029541015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,12288,7168,2048,8,384,8,1,power_law_1.2,1.2050496101379395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,1,balanced,0.08450133601824443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,1,balanced,0.0846560001373291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,1,power_law_1.01,0.08573439717292786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,1,power_law_1.01,0.08605440258979798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,1,power_law_1.2,0.08565760254859925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,1,power_law_1.2,0.0856768012046814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,128,balanced,0.037402667105197906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,128,balanced,0.03754666695992152
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,128,power_law_1.01,0.0353408008813858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,128,power_law_1.01,0.035366401076316833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,128,power_law_1.2,0.03457280099391937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,128,power_law_1.2,0.03484799861907959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,16,balanced,0.03363733241955439
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,16,balanced,0.03369066615899404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,16,power_law_1.01,0.0321152001619339
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,16,power_law_1.01,0.03223040103912354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,16,power_law_1.2,0.03206399977207184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,16,power_law_1.2,0.0328000009059906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,2,balanced,0.058373332023620605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,2,balanced,0.05871466795603434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,2,power_law_1.01,0.06069759726524353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,2,power_law_1.01,0.061286401748657224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,2,power_law_1.2,0.05994240045547485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,2,power_law_1.2,0.06099200248718262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,32,balanced,0.03765333443880081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,32,balanced,0.03822933385769526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,32,power_law_1.01,0.036595198512077334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,32,power_law_1.01,0.03697279989719391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,32,power_law_1.2,0.035750401020050046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,32,power_law_1.2,0.03578880131244659
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,4,balanced,0.03910933434963226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,4,balanced,0.04018666595220566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,4,power_law_1.01,0.04036479890346527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,4,power_law_1.01,0.041075199842453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,4,power_law_1.2,0.04073599874973297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,4,power_law_1.2,0.04215039908885956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,64,balanced,0.03754133234421412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,64,balanced,0.03766400118668874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,64,power_law_1.01,0.03529599905014038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,64,power_law_1.01,0.03590399920940399
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,64,power_law_1.2,0.034892800450325015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,64,power_law_1.2,0.03506560027599335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,8,balanced,0.03550933301448822
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,8,balanced,0.03566933423280716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,8,power_law_1.01,0.03434880077838898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,8,power_law_1.01,0.03460479974746704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,8,power_law_1.2,0.03467519879341126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,1,8,power_law_1.2,0.035129600763320924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,2,1,balanced,0.06033066908518473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,2,1,balanced,0.06195199986298879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,2,1,power_law_1.01,0.061382400989532473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,2,1,power_law_1.01,0.06261119842529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,2,1,power_law_1.2,0.0615231990814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,2,1,power_law_1.2,0.06222079992294312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,4,1,balanced,0.04320533573627472
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,4,1,balanced,0.04571199913819631
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,4,1,power_law_1.01,0.04811519980430603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,4,1,power_law_1.01,0.04976640045642853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,4,1,power_law_1.2,0.04863359928131104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,2048,768,8,128,4,1,power_law_1.2,0.049491199851036075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,1,balanced,0.3182400067647298
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,1,balanced,0.318725327650706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,1,power_law_1.01,0.26296319961547854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,1,power_law_1.01,0.26711039543151854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,1,power_law_1.2,0.2668800115585327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,1,power_law_1.2,0.2685247898101807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,128,balanced,0.05203733344872793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,128,balanced,0.05241066714127859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,128,power_law_1.01,0.049395200610160825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,128,power_law_1.01,0.04973439872264862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,128,power_law_1.2,0.04833920001983642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,128,power_law_1.2,0.049267199635505673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,16,balanced,0.0537066658337911
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,16,balanced,0.05421866476535797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,16,power_law_1.01,0.04844799935817719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,16,power_law_1.01,0.050316798686981204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,16,power_law_1.2,0.04929920136928558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,16,power_law_1.2,0.05011199712753296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,2,balanced,0.17678399880727133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,2,balanced,0.17684266964594522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,2,power_law_1.01,0.15204479694366455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,2,power_law_1.01,0.15774719715118407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,2,power_law_1.2,0.15244799852371216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,2,power_law_1.2,0.15406719446182252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,256,balanced,0.04357333481311798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,256,balanced,0.04402133325735728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,256,power_law_1.01,0.04063999950885773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,256,power_law_1.01,0.04088320136070252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,256,power_law_1.2,0.04056319892406464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,256,power_law_1.2,0.0409280002117157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,32,balanced,0.05136000116666158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,32,balanced,0.05156266689300537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,32,power_law_1.01,0.04503679871559143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,32,power_law_1.01,0.047891199588775635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,32,power_law_1.2,0.0443583995103836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,32,power_law_1.2,0.045023998618125914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,4,balanced,0.10616532961527507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,4,balanced,0.10669333736101787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,4,power_law_1.01,0.09226239919662475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,4,power_law_1.01,0.09671040177345276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,4,power_law_1.2,0.09074559807777405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,4,power_law_1.2,0.09260799884796142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,64,balanced,0.06640000144640605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,64,balanced,0.06643733382225037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,64,power_law_1.01,0.0588096022605896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,64,power_law_1.01,0.06159359812736511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,64,power_law_1.2,0.05687680244445801
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,64,power_law_1.2,0.05952640175819397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,8,balanced,0.07044266661008199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,8,balanced,0.07145600020885468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,8,power_law_1.01,0.06444159746170045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,8,power_law_1.01,0.06652799844741822
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,8,power_law_1.2,0.0657472014427185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,1,8,power_law_1.2,0.06591359972953796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,2,1,balanced,0.1789813240369161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,2,1,balanced,0.18026133378346762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,2,1,power_law_1.01,0.15442559719085694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,2,1,power_law_1.01,0.15546239614486695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,2,1,power_law_1.2,0.1531391978263855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,2,1,power_law_1.2,0.15413119792938232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,4,1,balanced,0.11104533076286316
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,4,1,balanced,0.11345600088437398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,4,1,power_law_1.01,0.09801599979400635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,4,1,power_law_1.01,0.10087039470672607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,4,1,power_law_1.2,0.10172799825668336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,4,1,power_law_1.2,0.10177919864654542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,8,1,balanced,0.08251733581225078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,8,1,balanced,0.08309866487979889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,8,1,power_law_1.01,0.07727360129356384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,8,1,power_law_1.01,0.07845759987831116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,8,1,power_law_1.2,0.07797120213508606
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,3072,1536,8,256,8,1,power_law_1.2,0.07800959944725036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,1,balanced,0.1810986598332723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,1,balanced,0.1818079948425293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,1,power_law_1.01,0.2051392078399658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,1,power_law_1.01,0.20767359733581542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,1,power_law_1.2,0.20684800148010254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,1,power_law_1.2,0.20974719524383545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,2,balanced,0.09304533402125041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,2,balanced,0.0946560005346934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,2,power_law_1.01,0.11235840320587158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,2,power_law_1.01,0.1128000020980835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,2,power_law_1.2,0.11459840536117553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,2,power_law_1.2,0.11712000370025635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,4,balanced,0.09219732880592346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,4,balanced,0.09226666887601216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,4,power_law_1.01,0.07562239766120911
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,4,power_law_1.01,0.0782912015914917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,4,power_law_1.2,0.07505279779434204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,4,power_law_1.2,0.07913600206375122
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,8,balanced,0.16337600350379944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,8,balanced,0.16475733121236166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,8,power_law_1.01,0.059385597705841064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,8,power_law_1.01,0.059513598680496216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,8,power_law_1.2,0.058963197469711306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,1,8,power_law_1.2,0.06716799736022949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,16,1,balanced,0.03572266548871994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,16,1,balanced,0.03625600039958954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,16,1,power_law_1.01,0.035820800065994265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,16,1,power_law_1.01,0.037088000774383546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,16,1,power_law_1.2,0.03480960130691528
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,16,1,power_law_1.2,0.036556801199913024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,2,1,balanced,0.10127466917037964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,2,1,balanced,0.10203199585278828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,2,1,power_law_1.01,0.11431039571762085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,2,1,power_law_1.01,0.11653759479522705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,2,1,power_law_1.2,0.11559679508209228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,2,1,power_law_1.2,0.11660159826278686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,32,1,balanced,0.03347733368476232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,32,1,balanced,0.03359466542800268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,32,1,power_law_1.01,0.03224320113658905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,32,1,power_law_1.01,0.03243519961833954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,32,1,power_law_1.2,0.032307198643684386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,32,1,power_law_1.2,0.032716798782348636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,4,1,balanced,0.07043733199437459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,4,1,balanced,0.07065600156784058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,4,1,power_law_1.01,0.07320320010185241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,4,1,power_law_1.01,0.07367680072784424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,4,1,power_law_1.2,0.07059199810028076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,4,1,power_law_1.2,0.0726207971572876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,8,1,balanced,0.051221330960591636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,8,1,balanced,0.05197866757710775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,8,1,power_law_1.01,0.05111039876937866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,8,1,power_law_1.01,0.05173119902610779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,8,1,power_law_1.2,0.05135359764099121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,14336,2,8,8,1,power_law_1.2,0.05145599842071533
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,1,balanced,0.22853867212931314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,1,balanced,0.22858132918675741
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,1,power_law_1.01,0.2314176082611084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,1,power_law_1.01,0.2355263948440552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,1,power_law_1.2,0.2330751895904541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,1,power_law_1.2,0.2358975887298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,128,balanced,0.0397119993964831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,128,balanced,0.03996799886226654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,128,power_law_1.01,0.03930239975452423
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,128,power_law_1.01,0.039827200770378116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,128,power_law_1.2,0.0392192006111145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,128,power_law_1.2,0.03996799886226654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,16,balanced,0.05411200225353241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,16,balanced,0.054799998799959816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,16,power_law_1.01,0.04799999892711639
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,16,power_law_1.01,0.05001599788665771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,16,power_law_1.2,0.046105599403381346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,16,power_law_1.2,0.04780159890651703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,2,balanced,0.13152533769607544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,2,balanced,0.13383466998736063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,2,power_law_1.01,0.1321727991104126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,2,power_law_1.01,0.13276159763336182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,2,power_law_1.2,0.13452160358428955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,2,power_law_1.2,0.13661439418792726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,32,balanced,0.06651199857393901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,32,balanced,0.06679999828338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,32,power_law_1.01,0.05726720094680786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,32,power_law_1.01,0.057555198669433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,32,power_law_1.2,0.057651197910308837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,32,power_law_1.2,0.058841598033905027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,4,balanced,0.08416533470153809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,4,balanced,0.08461333314577739
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,4,power_law_1.01,0.08227840065956116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,4,power_law_1.01,0.082777601480484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,4,power_law_1.2,0.08065279722213745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,4,power_law_1.2,0.08321279883384705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,64,balanced,0.04155733436346054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,64,balanced,0.041936000188191734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,64,power_law_1.01,0.040140798687934874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,64,power_law_1.01,0.04037759900093078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,64,power_law_1.2,0.03953920006752014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,64,power_law_1.2,0.04032639861106872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,8,balanced,0.062314664324124656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,8,balanced,0.06235733131567637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,8,power_law_1.01,0.05817599892616272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,8,power_law_1.01,0.05995519757270813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,8,power_law_1.2,0.060684800148010254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,1,8,power_law_1.2,0.061587202548980716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,2,1,balanced,0.1344266633192698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,2,1,balanced,0.13480533162752786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,2,1,power_law_1.01,0.13972480297088624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,2,1,power_law_1.01,0.1416767954826355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,2,1,power_law_1.2,0.1406399965286255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,2,1,power_law_1.2,0.14300160408020018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,4,1,balanced,0.08891200025876363
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,4,1,balanced,0.08925867080688477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,4,1,power_law_1.01,0.09137279987335205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,4,1,power_law_1.01,0.09232640266418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,4,1,power_law_1.2,0.09308159947395325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,4,1,power_law_1.2,0.09410560131072998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,8,1,balanced,0.0684799998998642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,8,1,balanced,0.07011199990908305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,8,1,power_law_1.01,0.07299200296401978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,8,1,power_law_1.01,0.07351679801940918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,8,1,power_law_1.2,0.07221760153770447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,4096,1536,8,128,8,1,power_law_1.2,0.0735040009021759
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,1,balanced,0.3622453212738037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,1,balanced,0.36236798763275146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,1,power_law_1.01,0.4195199966430664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,1,power_law_1.01,0.43259520530700685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,1,power_law_1.2,0.41503357887268066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,1,power_law_1.2,0.4250432014465332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,2,balanced,0.13828800121943155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,2,balanced,0.14050133029619852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,2,power_law_1.01,0.19738240242004396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,2,power_law_1.01,0.2033600091934204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,2,power_law_1.2,0.19052799940109252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,2,power_law_1.2,0.19845759868621826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,4,balanced,0.10637866457303365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,4,balanced,0.10801066954930623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,4,power_law_1.01,0.11182719469070435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,4,power_law_1.01,0.11495039463043213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,4,power_law_1.2,0.10536320209503174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,4,power_law_1.2,0.11208319664001465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,8,balanced,0.1753013332684835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,8,balanced,0.18569600582122803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,8,power_law_1.01,0.07175679802894593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,8,power_law_1.01,0.07219840288162231
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,8,power_law_1.2,0.07133439779281617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,1,8,power_law_1.2,0.07207040190696716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,16,1,balanced,0.04739200075467428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,16,1,balanced,0.04879466692606608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,16,1,power_law_1.01,0.04760960042476654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,16,1,power_law_1.01,0.04826880097389221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,16,1,power_law_1.2,0.04766719937324524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,16,1,power_law_1.2,0.048204800486564635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,2,1,balanced,0.14998933672904968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,2,1,balanced,0.15187733372052512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,2,1,power_law_1.01,0.1732095956802368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,2,1,power_law_1.01,0.17530239820480348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,2,1,power_law_1.2,0.17583999633789063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,2,1,power_law_1.2,0.17812479734420777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,32,1,balanced,0.03543466577927271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,32,1,balanced,0.03733866661787033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,32,1,power_law_1.01,0.03680639863014221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,32,1,power_law_1.01,0.03772160112857818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,32,1,power_law_1.2,0.0367935985326767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,32,1,power_law_1.2,0.03695360124111176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,4,1,balanced,0.09353066484133403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,4,1,balanced,0.09381332993507385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,4,1,power_law_1.01,0.10274560451507568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,4,1,power_law_1.01,0.10423040390014648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,4,1,power_law_1.2,0.10240000486373901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,4,1,power_law_1.2,0.10358400344848633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,8,1,balanced,0.0643093337615331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,8,1,balanced,0.06538666784763336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,8,1,power_law_1.01,0.06672639846801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,8,1,power_law_1.01,0.06840320229530335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,8,1,power_law_1.2,0.0669376015663147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,16384,2,8,8,1,power_law_1.2,0.06744319796562195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,1,balanced,0.7846506436665853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,1,balanced,0.7863039970397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,1,power_law_1.01,0.6409023761749267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,1,power_law_1.01,0.6493055820465088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,1,power_law_1.2,0.6483839988708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,1,power_law_1.2,0.6817215919494629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,128,balanced,0.06320000191529591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,128,balanced,0.06638399759928386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,128,power_law_1.01,0.058931201696395874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,128,power_law_1.01,0.058982402086257935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,128,power_law_1.2,0.05707520246505737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,128,power_law_1.2,0.05805439949035644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,16,balanced,0.08752000331878662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,16,balanced,0.08798933029174805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,16,power_law_1.01,0.07720959782600403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,16,power_law_1.01,0.08051199913024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,16,power_law_1.2,0.07813760042190551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,16,power_law_1.2,0.08254079818725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,2,balanced,0.41124268372853595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,2,balanced,0.4135306676228841
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,2,power_law_1.01,0.3398591995239258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,2,power_law_1.01,0.3427455902099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,2,power_law_1.2,0.36055679321289064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,2,power_law_1.2,0.3646591901779175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,256,balanced,0.0440586656332016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,256,balanced,0.044213334719340004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,256,power_law_1.01,0.042822399735450746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,256,power_law_1.01,0.04335359930992126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,256,power_law_1.2,0.04239999949932098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,256,power_law_1.2,0.042822399735450746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,32,balanced,0.08660800258318584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,32,balanced,0.08927466471989949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,32,power_law_1.01,0.07274240255355835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,32,power_law_1.01,0.07774080038070678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,32,power_law_1.2,0.06912000179290771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,32,power_law_1.2,0.07146239876747132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,4,balanced,0.22450133164723715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,4,balanced,0.22500266631444296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,4,power_law_1.01,0.19090559482574462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,4,power_law_1.01,0.19902080297470093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,4,power_law_1.2,0.1877120018005371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,4,power_law_1.2,0.19292160272598266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,64,balanced,0.11184533437093098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,64,balanced,0.11218667030334473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,64,power_law_1.01,0.09303680062294006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,64,power_law_1.01,0.09966719746589661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,64,power_law_1.2,0.09507840275764465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,64,power_law_1.2,0.09696000218391418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,8,balanced,0.13327999909718832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,8,balanced,0.13406933347384134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,8,power_law_1.01,0.11575679779052735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,8,power_law_1.01,0.12065279483795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,8,power_law_1.2,0.11752959489822387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,1,8,power_law_1.2,0.12050559520721435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,16,1,balanced,0.11181333661079407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,16,1,balanced,0.11198932925860088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,16,1,power_law_1.01,0.10533759593963624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,16,1,power_law_1.01,0.10712959766387939
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,16,1,power_law_1.2,0.10506880283355713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,16,1,power_law_1.2,0.10574079751968384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,2,1,balanced,0.41376535097757977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,2,1,balanced,0.4144586722056071
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,2,1,power_law_1.01,0.34606080055236815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,2,1,power_law_1.01,0.35383679866790774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,2,1,power_law_1.2,0.34752640724182127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,2,1,power_law_1.2,0.34856960773468015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,32,1,balanced,0.09502933422724406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,32,1,balanced,0.09505599737167358
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,32,1,power_law_1.01,0.09039999842643738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,32,1,power_law_1.01,0.09048960208892823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,32,1,power_law_1.2,0.09082880020141601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,32,1,power_law_1.2,0.09168639779090881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,4,1,balanced,0.22950933376948038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,4,1,balanced,0.23071465889612833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,4,1,power_law_1.01,0.19726719856262206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,4,1,power_law_1.01,0.19742079973220825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,4,1,power_law_1.2,0.1955072045326233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,4,1,power_law_1.2,0.20093441009521484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,8,1,balanced,0.1455519994099935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,8,1,balanced,0.14593066771825156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,8,1,power_law_1.01,0.13052799701690673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,8,1,power_law_1.01,0.13427200317382812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,8,1,power_law_1.2,0.13251839876174926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2048,8,256,8,1,power_law_1.2,0.13446400165557862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,1,balanced,0.6245386600494385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,1,balanced,0.6263519922892252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,1,power_law_1.01,0.5950143814086915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,1,power_law_1.01,0.6000576019287109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,1,power_law_1.2,0.6186816215515136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,1,power_law_1.2,0.6274816036224365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,16,balanced,0.10440533359845479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,16,balanced,0.10599467158317566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,16,power_law_1.01,0.09084799885749817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,16,power_law_1.01,0.09266560077667237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,16,power_law_1.2,0.08920959830284118
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,16,power_law_1.2,0.09308159947395325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,2,balanced,0.3317173322041829
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,2,balanced,0.3325493335723877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,2,power_law_1.01,0.31679999828338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,2,power_law_1.01,0.3283967971801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,2,power_law_1.2,0.32702078819274905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,2,power_law_1.2,0.3295232057571411
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,32,balanced,0.1777013341585795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,32,balanced,0.18622400363286337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,32,power_law_1.01,0.1414528012275696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,32,power_law_1.01,0.15074559450149536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,32,power_law_1.2,0.1393728017807007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,32,power_law_1.2,0.14714879989624025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,4,balanced,0.18588266770044962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,4,balanced,0.18652800718943277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,4,power_law_1.01,0.17170560359954834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,4,power_law_1.01,0.1764672040939331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,4,power_law_1.2,0.1754240036010742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,4,power_law_1.2,0.1786687970161438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,8,balanced,0.11542933185895284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,8,balanced,0.11548266808191936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,8,power_law_1.01,0.10535039901733398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,8,power_law_1.01,0.11027840375900269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,8,power_law_1.2,0.11013760566711425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,1,8,power_law_1.2,0.11051520109176635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,2,1,balanced,0.3339039882024129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,2,1,balanced,0.33409066994984943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,2,1,power_law_1.01,0.3192512035369873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,2,1,power_law_1.01,0.33113598823547363
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,2,1,power_law_1.2,0.3305984020233154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,2,1,power_law_1.2,0.33583359718322753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,4,1,balanced,0.19559999306996664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,4,1,balanced,0.19564799467722574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,4,1,power_law_1.01,0.19212160110473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,4,1,power_law_1.01,0.19767040014266968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,4,1,power_law_1.2,0.2039936065673828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,4,1,power_law_1.2,0.20485761165618896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,8,1,balanced,0.12221866846084595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,8,1,balanced,0.12340266505877177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,8,1,power_law_1.01,0.12295039892196655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,8,1,power_law_1.01,0.12449920177459717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,8,1,power_law_1.2,0.12483199834823608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,6144,2560,8,160,8,1,power_law_1.2,0.1249343991279602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,1,balanced,0.9112693468729655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,1,balanced,0.9129066467285156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,1,power_law_1.01,0.7663167953491211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,1,power_law_1.01,0.771014404296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,1,power_law_1.2,0.767628812789917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,1,power_law_1.2,0.7744383811950684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,128,balanced,0.07086400190989177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,128,balanced,0.07206400235493977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,128,power_law_1.01,0.0639743983745575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,128,power_law_1.01,0.06602879762649536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,128,power_law_1.2,0.06421759724617004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,128,power_law_1.2,0.06604160070419311
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,16,balanced,0.09730133414268494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,16,balanced,0.09844266374905904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,16,power_law_1.01,0.0889087975025177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,16,power_law_1.01,0.09223679900169372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,16,power_law_1.2,0.08787840008735656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,16,power_law_1.2,0.09066879749298096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,2,balanced,0.47419734795888263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,2,balanced,0.47543466091156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,2,power_law_1.01,0.3892159938812256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,2,power_law_1.01,0.39234559535980223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,2,power_law_1.2,0.3995136022567749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,2,power_law_1.2,0.41396479606628417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,256,balanced,0.04780800143877665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,256,balanced,0.04789333542188009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,256,power_law_1.01,0.04444159865379334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,256,power_law_1.01,0.044896000623703004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,256,power_law_1.2,0.04457600116729736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,256,power_law_1.2,0.04475519955158234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,32,balanced,0.09179733196894328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,32,balanced,0.09190932909647624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,32,power_law_1.01,0.07904639840126038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,32,power_law_1.01,0.08405759930610657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,32,power_law_1.2,0.08343679904937744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,32,power_law_1.2,0.0850048005580902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,4,balanced,0.2571573257446289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,4,balanced,0.25896533330281574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,4,power_law_1.01,0.22269439697265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,4,power_law_1.01,0.23169279098510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,4,power_law_1.2,0.2128448009490967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,4,power_law_1.2,0.24403839111328124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,64,balanced,0.13275200128555298
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,64,balanced,0.13433600465456644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,64,power_law_1.01,0.10689280033111573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,64,power_law_1.01,0.1142848014831543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,64,power_law_1.2,0.11148799657821655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,64,power_law_1.2,0.11187200546264649
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,8,balanced,0.15028267105420431
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,8,balanced,0.15065600474675497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,8,power_law_1.01,0.1323456048965454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,8,power_law_1.01,0.1339840054512024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,8,power_law_1.2,0.13730560541152953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,1,8,power_law_1.2,0.13925119638442993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,16,1,balanced,0.12595733006795248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,16,1,balanced,0.12796800335248312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,16,1,power_law_1.01,0.11866879463195801
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,16,1,power_law_1.01,0.12016639709472657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,16,1,power_law_1.2,0.11900160312652588
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,16,1,power_law_1.2,0.11972479820251465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,2,1,balanced,0.47755734125773114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,2,1,balanced,0.4787360032399495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,2,1,power_law_1.01,0.4039167881011963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,2,1,power_law_1.01,0.40403199195861816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,2,1,power_law_1.2,0.39836161136627196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,2,1,power_law_1.2,0.40128002166748045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,32,1,balanced,0.10598933696746826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,32,1,balanced,0.10714667042096455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,32,1,power_law_1.01,0.10085760354995728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,32,1,power_law_1.01,0.101254403591156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,32,1,power_law_1.2,0.10287359952926636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,32,1,power_law_1.2,0.10357760190963745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,4,1,balanced,0.2638240059216817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,4,1,balanced,0.2654026746749878
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,4,1,power_law_1.01,0.22422399520874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,4,1,power_law_1.01,0.23033599853515624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,4,1,power_law_1.2,0.22692480087280273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,4,1,power_law_1.2,0.22783999443054198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,8,1,balanced,0.16595733165740967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,8,1,balanced,0.16682666540145874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,8,1,power_law_1.01,0.14873600006103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,8,1,power_law_1.01,0.15119999647140503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,8,1,power_law_1.2,0.1491520047187805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,256,8,1,power_law_1.2,0.1541375994682312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,1,balanced,1.3397332827250164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,1,balanced,1.3408586184183757
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,1,power_law_1.01,1.0062335968017577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,1,power_law_1.01,1.010707187652588
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,1,power_law_1.2,0.9815103530883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,1,power_law_1.2,0.9939647674560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,128,balanced,0.1049173374970754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,128,balanced,0.10923199852307637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,128,power_law_1.01,0.0951744019985199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,128,power_law_1.01,0.09891200065612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,128,power_law_1.2,0.09626240134239197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,128,power_law_1.2,0.09720320105552674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,16,balanced,0.12729600071907043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,16,balanced,0.12811733285586038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,16,power_law_1.01,0.11196160316467285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,16,power_law_1.01,0.11274240016937256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,16,power_law_1.2,0.10643199682235718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,16,power_law_1.2,0.10691839456558228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,2,balanced,0.6895093123118082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,2,balanced,0.6899200280507406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,2,power_law_1.01,0.5485951900482178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,2,power_law_1.01,0.5797440052032471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,2,power_law_1.2,0.5356416225433349
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,2,power_law_1.2,0.540012788772583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,32,balanced,0.12427199880282085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,32,balanced,0.12683199842770895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,32,power_law_1.01,0.10111360549926758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,32,power_law_1.01,0.10373120307922364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,32,power_law_1.2,0.09713280200958252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,32,power_law_1.2,0.1085055947303772
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,4,balanced,0.36396265029907227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,4,balanced,0.36450668176015216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,4,power_law_1.01,0.30213758945465086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,4,power_law_1.01,0.33124480247497556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,4,power_law_1.2,0.2739903926849365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,4,power_law_1.2,0.3027008056640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,64,balanced,0.2007733384768168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,64,balanced,0.20357332626978555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,64,power_law_1.01,0.17293440103530883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,64,power_law_1.01,0.18328959941864015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,64,power_law_1.2,0.1757375955581665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,64,power_law_1.2,0.17623039484024047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,8,balanced,0.2030186653137207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,8,balanced,0.20430399974187216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,8,power_law_1.01,0.17428480386734008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,8,power_law_1.01,0.18793599605560302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,8,power_law_1.2,0.15996160507202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,1,8,power_law_1.2,0.17237759828567506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,16,1,balanced,0.16697067022323608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,16,1,balanced,0.16702934106191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,16,1,power_law_1.01,0.14214400053024293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,16,1,power_law_1.01,0.14264960289001466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,16,1,power_law_1.2,0.14143999814987182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,16,1,power_law_1.2,0.14158719778060913
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,2,1,balanced,0.6919413407643636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,2,1,balanced,0.6930027008056641
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,2,1,power_law_1.01,0.5227839946746826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,2,1,power_law_1.01,0.5276800155639648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,2,1,power_law_1.2,0.5084352016448974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,2,1,power_law_1.2,0.5135807991027832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,32,1,balanced,0.13682132959365845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,32,1,balanced,0.13806933164596558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,32,1,power_law_1.01,0.12327680587768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,32,1,power_law_1.01,0.12387200593948364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,32,1,power_law_1.2,0.12031999826431275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,32,1,power_law_1.2,0.12181119918823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,4,1,balanced,0.3708639939626058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,4,1,balanced,0.37170132001241046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,4,1,power_law_1.01,0.29018239974975585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,4,1,power_law_1.01,0.29171841144561766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,4,1,power_law_1.2,0.28635520935058595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,4,1,power_law_1.2,0.28828160762786864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,8,1,balanced,0.2235893408457438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,8,1,balanced,0.22373332579930624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,8,1,power_law_1.01,0.18355200290679932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,8,1,power_law_1.01,0.18436479568481445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,8,1,power_law_1.2,0.17992960214614867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,128,7168,2048,8,384,8,1,power_law_1.2,0.1823807954788208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,1,balanced,0.1646666626135508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,1,balanced,0.1662560005982717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,1,power_law_1.01,0.14807679653167724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,1,power_law_1.01,0.14895360469818114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,1,power_law_1.2,0.15229439735412598
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,1,power_law_1.2,0.15237120389938355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,128,balanced,0.04593066871166229
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,128,balanced,0.04597333570321401
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,128,power_law_1.01,0.045638400316238406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,128,power_law_1.01,0.046412798762321475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,128,power_law_1.2,0.04705919921398163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,128,power_law_1.2,0.047328001260757445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,16,balanced,0.04785066843032837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,16,balanced,0.04791999856630961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,16,power_law_1.01,0.05258880257606506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,16,power_law_1.01,0.054425597190856934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,16,power_law_1.2,0.05310720205307007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,16,power_law_1.2,0.05438079833984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,2,balanced,0.0959999958674113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,2,balanced,0.09705600142478943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,2,power_law_1.01,0.10755200386047363
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,2,power_law_1.01,0.10901119709014892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,2,power_law_1.2,0.11070719957351685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,2,power_law_1.2,0.11379200220108032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,32,balanced,0.04654400050640106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,32,balanced,0.04779199759165446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,32,power_law_1.01,0.048851200938224794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,32,power_law_1.01,0.0493120014667511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,32,power_law_1.2,0.04938879907131195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,32,power_law_1.2,0.05196800231933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,4,balanced,0.07051200171311696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,4,balanced,0.07113066812356313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,4,power_law_1.01,0.0796288013458252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,4,power_law_1.01,0.08414080142974853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,4,power_law_1.2,0.0822272002696991
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,4,power_law_1.2,0.08261119723320007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,64,balanced,0.045968001087506614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,64,balanced,0.04781333108743032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,64,power_law_1.01,0.046367999911308286
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,64,power_law_1.01,0.04764800071716309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,64,power_law_1.2,0.047737601399421695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,64,power_law_1.2,0.04805119931697845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,8,balanced,0.05351466437180837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,8,balanced,0.05414933462937673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,8,power_law_1.01,0.06178560256958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,8,power_law_1.01,0.06273279786109924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,8,power_law_1.2,0.06197119951248169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,1,8,power_law_1.2,0.06439679861068726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,2,1,balanced,0.10797333717346191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,2,1,balanced,0.10824533303578694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,2,1,power_law_1.01,0.10280959606170655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,2,1,power_law_1.01,0.10334080457687378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,2,1,power_law_1.2,0.10329600572586059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,4,1,balanced,0.09994666775067647
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,4,1,balanced,0.1013759970664978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,4,1,power_law_1.01,0.09355520009994507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,4,1,power_law_1.01,0.0941760003566742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,4,1,power_law_1.2,0.09393280148506164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,2048,768,8,128,4,1,power_law_1.2,0.09415040016174317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,1,balanced,0.4270506699879964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,1,balanced,0.43086934089660645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,1,power_law_1.01,0.44831361770629885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,1,power_law_1.01,0.4533504009246826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,1,power_law_1.2,0.4696767807006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,1,power_law_1.2,0.4750016212463379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,128,balanced,0.053727999329566956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,128,balanced,0.05385066568851471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,128,power_law_1.01,0.05369600057601929
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,128,power_law_1.01,0.05413119792938233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,128,power_law_1.2,0.055801600217819214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,128,power_law_1.2,0.056505602598190305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,16,balanced,0.08043733239173889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,16,balanced,0.08097599943478902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,16,power_law_1.01,0.08372480273246766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,16,power_law_1.01,0.08498560190200806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,16,power_law_1.2,0.08654080033302307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,16,power_law_1.2,0.08732799887657165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,2,balanced,0.21589332818984985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,2,balanced,0.21591466665267944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,2,power_law_1.01,0.23037440776824952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,2,power_law_1.01,0.232857608795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,2,power_law_1.2,0.24022400379180908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,2,power_law_1.2,0.24736640453338624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,256,balanced,0.05384533107280731
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,256,balanced,0.05389333268006643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,256,power_law_1.01,0.052275198698043826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,256,power_law_1.01,0.0523967981338501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,256,power_law_1.2,0.05372160077095032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,256,power_law_1.2,0.05432320237159729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,32,balanced,0.06482133269309998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,32,balanced,0.06670933465162913
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,32,power_law_1.01,0.0694208025932312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,32,power_law_1.01,0.07107840180397033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,32,power_law_1.2,0.07129600048065185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,32,power_law_1.2,0.07263360023498536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,4,balanced,0.2480000058809916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,4,balanced,0.2496053377787272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,4,power_law_1.01,0.18611840009689332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,4,power_law_1.01,0.18962559700012208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,4,power_law_1.2,0.19769599437713622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,4,power_law_1.2,0.20396800041198732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,64,balanced,0.05427733560403188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,64,balanced,0.05551999807357788
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,64,power_law_1.01,0.058374398946762086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,64,power_law_1.01,0.06182399988174438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,64,power_law_1.2,0.06033920049667359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,64,power_law_1.2,0.06125440001487732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,8,balanced,0.10291733344395955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,8,balanced,0.10745599865913391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,8,power_law_1.01,0.10424319505691529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,8,power_law_1.01,0.10826879739761353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,8,power_law_1.2,0.11224960088729859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,1,8,power_law_1.2,0.11423360109329224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,2,1,balanced,0.258730669816335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,2,1,balanced,0.25914132595062256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,2,1,power_law_1.01,0.26933119297027586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,2,1,power_law_1.01,0.27426559925079347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,2,1,power_law_1.2,0.281062388420105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,2,1,power_law_1.2,0.2823296070098877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,4,1,balanced,0.18096532424290976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,4,1,balanced,0.18104533354441324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,4,1,power_law_1.01,0.1820672035217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,4,1,power_law_1.01,0.1831936001777649
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,4,1,power_law_1.2,0.18796160221099853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,4,1,power_law_1.2,0.18900480270385742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,8,1,balanced,0.14410666624704996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,8,1,balanced,0.14565333724021912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,8,1,power_law_1.01,0.1424831986427307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,8,1,power_law_1.01,0.14351999759674072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,8,1,power_law_1.2,0.14588160514831544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,3072,1536,8,256,8,1,power_law_1.2,0.14737919569015503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,1,balanced,0.3707786798477173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,1,balanced,0.37116265296936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,1,power_law_1.01,0.43337597846984866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,1,power_law_1.01,0.4494272232055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,1,power_law_1.2,0.4369664192199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,1,power_law_1.2,0.4415487766265869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,2,balanced,0.2168160080909729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,2,balanced,0.21738133827845255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,2,power_law_1.01,0.29758079051971437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,2,power_law_1.01,0.29947519302368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,2,power_law_1.2,0.31916160583496095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,2,power_law_1.2,0.32517759799957274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,4,balanced,0.14727999766667685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,4,balanced,0.14832533399264017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,4,power_law_1.01,0.22117118835449218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,4,power_law_1.01,0.2555775880813599
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,4,power_law_1.2,0.22417280673980713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,4,power_law_1.2,0.2311552047729492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,8,balanced,0.10393066207567851
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,8,balanced,0.10405866305033366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,8,power_law_1.01,0.18391040563583375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,8,power_law_1.01,0.1846400022506714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,8,power_law_1.2,0.1856384038925171
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,1,8,power_law_1.2,0.1949504017829895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,16,1,balanced,0.08277333279450734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,16,1,balanced,0.08296533425649007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,16,1,power_law_1.01,0.08362879753112792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,16,1,power_law_1.01,0.08402559757232667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,16,1,power_law_1.2,0.08271999955177307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,16,1,power_law_1.2,0.0847487986087799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,2,1,balanced,0.21318399906158447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,2,1,balanced,0.21357866128285727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,2,1,power_law_1.01,0.24414079189300536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,2,1,power_law_1.01,0.25388801097869873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,2,1,power_law_1.2,0.24160640239715575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,2,1,power_law_1.2,0.25520639419555663
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,32,1,balanced,0.07239999870459239
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,32,1,balanced,0.07242666681607564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,32,1,power_law_1.01,0.07170559763908387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,32,1,power_law_1.01,0.07306240200996399
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,32,1,power_law_1.2,0.07322239875793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,32,1,power_law_1.2,0.0735871970653534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,4,1,balanced,0.14129599928855896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,4,1,balanced,0.141375998655955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,4,1,power_law_1.01,0.1500991940498352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,4,1,power_law_1.01,0.15294719934463502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,4,1,power_law_1.2,0.15509120225906373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,4,1,power_law_1.2,0.16313600540161133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,8,1,balanced,0.10038399696350098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,8,1,balanced,0.10116266210873921
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,8,1,power_law_1.01,0.10695680379867553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,8,1,power_law_1.01,0.10826239585876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,8,1,power_law_1.2,0.10940799713134766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,14336,2,8,8,1,power_law_1.2,0.11194239854812622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,1,balanced,0.43457067012786865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,1,balanced,0.4381706714630127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,1,power_law_1.01,0.37684481143951415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,1,power_law_1.01,0.38134400844573973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,1,power_law_1.2,0.38694400787353517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,1,power_law_1.2,0.3886080026626587
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,128,balanced,0.059215997656186424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,128,balanced,0.05994133154551188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,128,power_law_1.01,0.06027519702911377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,128,power_law_1.01,0.060710400342941284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,128,power_law_1.2,0.06750720143318176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,128,power_law_1.2,0.06753919720649719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,16,balanced,0.07976533472537994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,16,balanced,0.08000533282756805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,16,power_law_1.01,0.08595200181007386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,16,power_law_1.01,0.09151359796524047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,16,power_law_1.2,0.09394559860229493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,16,power_law_1.2,0.09599999785423279
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,2,balanced,0.2311306595802307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,2,balanced,0.23122133811314902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,2,power_law_1.01,0.22547199726104736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,2,power_law_1.01,0.23326079845428466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,2,power_law_1.2,0.22987520694732666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,2,power_law_1.2,0.2393343925476074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,32,balanced,0.06306666632493337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,32,balanced,0.06432533264160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,32,power_law_1.01,0.07416319847106934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,32,power_law_1.01,0.07869439721107482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,32,power_law_1.2,0.07868800163269044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,32,power_law_1.2,0.08015999794006348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,4,balanced,0.12504000465075174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,4,balanced,0.12573333581288657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,4,power_law_1.01,0.15563520193099975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,4,power_law_1.01,0.17622400522232057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,4,power_law_1.2,0.17859840393066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,4,power_law_1.2,0.18149759769439697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,64,balanced,0.05950400233268738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,64,balanced,0.05964266757170359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,64,power_law_1.01,0.06686080098152161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,64,power_law_1.01,0.06935039758682252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,64,power_law_1.2,0.06933119893074036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,64,power_law_1.2,0.06933760046958923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,8,balanced,0.09515733520189922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,8,balanced,0.09559466441472371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,8,power_law_1.01,0.1056447982788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,8,power_law_1.01,0.10662399530410767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,8,power_law_1.2,0.11493760347366333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,1,8,power_law_1.2,0.11756800413131714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,2,1,balanced,0.2765760024388631
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,2,1,balanced,0.28219733635584515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,2,1,power_law_1.01,0.24336640834808348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,2,1,power_law_1.01,0.24606080055236818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,2,1,power_law_1.2,0.2532543897628784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,2,1,power_law_1.2,0.25345919132232664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,4,1,balanced,0.17898666858673096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,4,1,balanced,0.1815626621246338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,4,1,power_law_1.01,0.1645311951637268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,4,1,power_law_1.01,0.16491520404815674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,4,1,power_law_1.2,0.16658560037612916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,4,1,power_law_1.2,0.1676095962524414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,8,1,balanced,0.1565013329188029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,8,1,balanced,0.15687466661135355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,8,1,power_law_1.01,0.15104000568389891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,8,1,power_law_1.01,0.1569983959197998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,8,1,power_law_1.2,0.15502079725265502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,4096,1536,8,128,8,1,power_law_1.2,0.164518404006958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,1,balanced,0.6421440045038859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,1,balanced,0.6452213525772095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,1,power_law_1.01,0.8113151550292969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,1,power_law_1.01,0.8504768371582031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,1,power_law_1.2,0.767910385131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,1,power_law_1.2,0.8252799987792969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,2,balanced,0.3386133511861165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,2,balanced,0.3397226730982463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,2,power_law_1.01,0.46519041061401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,2,power_law_1.01,0.5082623958587646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,2,power_law_1.2,0.5175615787506104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,2,power_law_1.2,0.5334208011627197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,4,balanced,0.20132799943288168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,4,balanced,0.20318400859832764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,4,power_law_1.01,0.3804352045059204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,4,power_law_1.01,0.41132159233093263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,4,power_law_1.2,0.3846463918685913
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,4,power_law_1.2,0.3873600006103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,8,balanced,0.1381333371003469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,8,balanced,0.14062399665514627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,8,power_law_1.01,0.2765568017959595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,8,power_law_1.01,0.3235840082168579
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,8,power_law_1.2,0.3135807991027832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,1,8,power_law_1.2,0.322489595413208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,16,1,balanced,0.10487467050552368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,16,1,balanced,0.10680533448855083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,16,1,power_law_1.01,0.11441919803619385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,16,1,power_law_1.01,0.1147968053817749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,16,1,power_law_1.2,0.1139456033706665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,16,1,power_law_1.2,0.11469440460205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,2,1,balanced,0.3145013252894084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,2,1,balanced,0.316922664642334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,2,1,power_law_1.01,0.3693631887435913
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,2,1,power_law_1.01,0.3952768087387085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,2,1,power_law_1.2,0.358188796043396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,2,1,power_law_1.2,0.37544960975646974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,32,1,balanced,0.0939520001411438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,32,1,balanced,0.0942080020904541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,32,1,power_law_1.01,0.09403520226478576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,32,1,power_law_1.01,0.09474560022354125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,32,1,power_law_1.2,0.09363840222358703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,32,1,power_law_1.2,0.09370239973068237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,4,1,balanced,0.1979573369026184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,4,1,balanced,0.1982240080833435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,4,1,power_law_1.01,0.23144960403442383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,4,1,power_law_1.01,0.24074239730834962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,4,1,power_law_1.2,0.22684800624847412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,4,1,power_law_1.2,0.23267199993133544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,8,1,balanced,0.1388159990310669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,8,1,balanced,0.13915733496348062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,8,1,power_law_1.01,0.14948480129241942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,8,1,power_law_1.01,0.15635199546813966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,8,1,power_law_1.2,0.15086079835891725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,16384,2,8,8,1,power_law_1.2,0.15334399938583373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,1,balanced,1.0491306781768799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,1,balanced,1.0534026622772217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,1,power_law_1.01,1.1141056060791015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,1,power_law_1.01,1.1180864334106446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,1,power_law_1.2,1.175539207458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,1,power_law_1.2,1.1755840301513671
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,128,balanced,0.0774186650911967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,128,balanced,0.07880533238252004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,128,power_law_1.01,0.08720639944076539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,128,power_law_1.01,0.08966400027275086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,128,power_law_1.2,0.09205120205879211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,128,power_law_1.2,0.09258239865303039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,16,balanced,0.13595733046531677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,16,balanced,0.1381013294061025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,16,power_law_1.01,0.14149760007858275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,16,power_law_1.01,0.1425920009613037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,16,power_law_1.2,0.14940160512924194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,16,power_law_1.2,0.1511680006980896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,2,balanced,0.4869973262151082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,2,balanced,0.48822398980458576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,2,power_law_1.01,0.5356607913970948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,2,power_law_1.01,0.5423168182373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,2,power_law_1.2,0.5759168148040772
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,2,power_law_1.2,0.5872191905975341
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,256,balanced,0.07256000240643819
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,256,balanced,0.07261333366235097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,256,power_law_1.01,0.07457280158996582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,256,power_law_1.01,0.07639679908752442
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,256,power_law_1.2,0.08095999956130981
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,256,power_law_1.2,0.08522239923477173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,32,balanced,0.1081119974454244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,32,balanced,0.10844799876213074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,32,power_law_1.01,0.11242239475250244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,32,power_law_1.01,0.11525119543075561
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,32,power_law_1.2,0.1158336043357849
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,32,power_law_1.2,0.11627520322799682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,4,balanced,0.4910293420155843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,4,balanced,0.4918400049209595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,4,power_law_1.01,0.3467072010040283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,4,power_law_1.01,0.41103358268737794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,4,power_law_1.2,0.37674241065979003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,4,power_law_1.2,0.3966655969619751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,64,balanced,0.09124267101287842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,64,balanced,0.09178133805592854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,64,power_law_1.01,0.0970304012298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,64,power_law_1.01,0.09829760193824769
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,64,power_law_1.2,0.09944959878921508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,64,power_law_1.2,0.10144000053405762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,8,balanced,0.19610132773717245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,8,balanced,0.19612266620000204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,8,power_law_1.01,0.19719680547714233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,8,power_law_1.01,0.19990400075912476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,8,power_law_1.2,0.21368958950042724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,1,8,power_law_1.2,0.21811199188232422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,16,1,balanced,0.2222506602605184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,16,1,balanced,0.22285866737365723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,16,1,power_law_1.01,0.2257983922958374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,16,1,power_law_1.01,0.22688000202178954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,16,1,power_law_1.2,0.22947840690612792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,16,1,power_law_1.2,0.23016960620880128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,2,1,balanced,0.5754986604054769
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,2,1,balanced,0.5762773354848226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,2,1,power_law_1.01,0.6067391872406006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,2,1,power_law_1.01,0.6105472087860108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,2,1,power_law_1.2,0.6369664192199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,2,1,power_law_1.2,0.6375360012054443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,32,1,balanced,0.20365333557128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,32,1,balanced,0.20433066288630167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,32,1,power_law_1.01,0.2049855947494507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,32,1,power_law_1.01,0.2052992105484009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,32,1,power_law_1.2,0.2067903995513916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,32,1,power_law_1.2,0.2071552038192749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,4,1,balanced,0.3627893527348836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,4,1,balanced,0.36287466684977215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,4,1,power_law_1.01,0.3715903997421265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,4,1,power_law_1.01,0.37241599559783933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,4,1,power_law_1.2,0.3834815979003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,4,1,power_law_1.2,0.38945279121398924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,8,1,balanced,0.26310932636260986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,8,1,balanced,0.2635200023651123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,8,1,power_law_1.01,0.2666239976882935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,8,1,power_law_1.01,0.2673856019973755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,8,1,power_law_1.2,0.2733439922332764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2048,8,256,8,1,power_law_1.2,0.27761919498443605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,1,balanced,1.2967466513315837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,1,balanced,1.3142133553822835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,1,power_law_1.01,0.9404288291931152
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,1,power_law_1.01,0.9497088432312012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,1,power_law_1.2,0.9826687812805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,1,power_law_1.2,0.9844672203063964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,16,balanced,0.12197867035865784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,16,balanced,0.12304533521334331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,16,power_law_1.01,0.14169600009918212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,16,power_law_1.01,0.1445312023162842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,16,power_law_1.2,0.1534208059310913
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,16,power_law_1.2,0.15508480072021485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,2,balanced,0.687274694442749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,2,balanced,0.6892853577931722
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,2,power_law_1.01,0.6063744068145752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,2,power_law_1.01,0.6404160022735595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,2,power_law_1.2,0.5631423950195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,2,power_law_1.2,0.605836820602417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,32,balanced,0.10150933265686035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,32,balanced,0.10266133149464925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,32,power_law_1.01,0.1158336043357849
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,32,power_law_1.01,0.11911040544509888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,32,power_law_1.2,0.12106239795684814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,32,power_law_1.2,0.12289279699325562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,4,balanced,0.2495786746342977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,4,balanced,0.2502506573994954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,4,power_law_1.01,0.3109888076782227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,4,power_law_1.01,0.33742079734802244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,4,power_law_1.2,0.3359488010406494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,4,power_law_1.2,0.3568128108978271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,8,balanced,0.16452266772588095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,8,balanced,0.1646613379319509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,8,power_law_1.01,0.19714560508728027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,8,power_law_1.01,0.2016767978668213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,8,power_law_1.2,0.20896639823913574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,1,8,power_law_1.2,0.21326720714569092
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,2,1,balanced,0.7163039843241373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,2,1,balanced,0.7185920079549154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,2,1,power_law_1.01,0.5374080181121826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,2,1,power_law_1.01,0.5421440124511718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,2,1,power_law_1.2,0.5528895854949951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,2,1,power_law_1.2,0.5588223934173584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,4,1,balanced,0.45527998606363934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,4,1,balanced,0.49666134516398114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,4,1,power_law_1.01,0.3556288003921509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,4,1,power_law_1.01,0.3836159944534302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,4,1,power_law_1.2,0.3650304079055786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,4,1,power_law_1.2,0.3665791988372803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,8,1,balanced,0.29959466060002643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,8,1,balanced,0.3063039978345235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,8,1,power_law_1.01,0.24747519493103026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,8,1,power_law_1.01,0.2500096082687378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,8,1,power_law_1.2,0.2546880006790161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,6144,2560,8,160,8,1,power_law_1.2,0.2552704095840454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,1,balanced,1.2155253092447917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,1,balanced,1.238421360651652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,1,power_law_1.01,1.2889344215393066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,1,power_law_1.01,1.315244770050049
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,1,power_law_1.2,1.3789759635925294
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,1,power_law_1.2,1.384166431427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,128,balanced,0.09085333347320557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,128,balanced,0.09105599919954936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,128,power_law_1.01,0.09413120150566101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,128,power_law_1.01,0.09713919758796692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,128,power_law_1.2,0.10173439979553223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,128,power_law_1.2,0.1021183967590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,16,balanced,0.15405333042144775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,16,balanced,0.15665599703788757
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,16,power_law_1.01,0.15852160453796388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,16,power_law_1.01,0.16419199705123902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,16,power_law_1.2,0.16444159746170045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,16,power_law_1.2,0.17114239931106567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,2,balanced,0.5650879939397176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,2,balanced,0.5659679969151815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,2,power_law_1.01,0.6208640098571777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,2,power_law_1.01,0.6282303810119629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,2,power_law_1.2,0.6620351791381835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,2,power_law_1.2,0.6770815849304199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,256,balanced,0.08131200075149536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,256,balanced,0.08156266808509827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,256,power_law_1.01,0.08677759766578674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,256,power_law_1.01,0.08750079870223999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,256,power_law_1.2,0.09484800100326538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,256,power_law_1.2,0.09559680223464966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,32,balanced,0.12079466382662456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,32,balanced,0.12294933199882507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,32,power_law_1.01,0.12183680534362792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,32,power_law_1.01,0.12673920392990112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,32,power_law_1.2,0.1320639967918396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,32,power_law_1.2,0.13530240058898926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,4,balanced,0.5610880057017008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,4,balanced,0.5628213485081991
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,4,power_law_1.01,0.43523201942443845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,4,power_law_1.01,0.4419839859008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,4,power_law_1.2,0.4212224006652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,4,power_law_1.2,0.4488639831542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,64,balanced,0.09987200299898784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,64,balanced,0.10274666547775269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,64,power_law_1.01,0.10638079643249512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,64,power_law_1.01,0.10729600191116333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,64,power_law_1.2,0.10872960090637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,64,power_law_1.2,0.11450879573822022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,8,balanced,0.2179786761601766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,8,balanced,0.21884800990422568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,8,power_law_1.01,0.2265023946762085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,8,power_law_1.01,0.23023359775543212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,8,power_law_1.2,0.2392319917678833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,1,8,power_law_1.2,0.25613439083099365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,16,1,balanced,0.25473066171010333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,16,1,balanced,0.2547626694043477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,16,1,power_law_1.01,0.2608896017074585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,16,1,power_law_1.01,0.2610687971115112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,16,1,power_law_1.2,0.2636480093002319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,16,1,power_law_1.2,0.2657344102859497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,2,1,balanced,0.6682613690694174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,2,1,balanced,0.668842633565267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,2,1,power_law_1.01,0.7020800113677979
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,2,1,power_law_1.01,0.7048831939697265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,2,1,power_law_1.2,0.7368127822875976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,2,1,power_law_1.2,0.7449920177459717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,32,1,balanced,0.23438400030136108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,32,1,balanced,0.23504533370335898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,32,1,power_law_1.01,0.23410561084747314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,32,1,power_law_1.01,0.23441920280456544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,32,1,power_law_1.2,0.2373055934906006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,32,1,power_law_1.2,0.23965439796447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,4,1,balanced,0.42029333114624023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,4,1,balanced,0.4220106601715088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,4,1,power_law_1.01,0.42863998413085935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,4,1,power_law_1.01,0.4310783863067627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,4,1,power_law_1.2,0.44752001762390137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,4,1,power_law_1.2,0.45165438652038575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,8,1,balanced,0.3030933340390523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,8,1,balanced,0.3032426635424296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,8,1,power_law_1.01,0.30870399475097654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,8,1,power_law_1.01,0.30979199409484864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,8,1,power_law_1.2,0.31704959869384763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,256,8,1,power_law_1.2,0.3178368091583252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,1,balanced,1.6389013926188152
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,1,balanced,1.7505653699239094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,1,power_law_1.01,1.9175935745239259
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,1,power_law_1.01,1.9523136138916015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,1,power_law_1.2,2.03110408782959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,1,power_law_1.2,2.0428607940673826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,128,balanced,0.09507200121879578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,128,balanced,0.09537600477536519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,128,power_law_1.01,0.09921919703483581
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,128,power_law_1.01,0.10102399587631225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,128,power_law_1.2,0.10252159833908081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,128,power_law_1.2,0.10497920513153076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,16,balanced,0.1860640048980713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,16,balanced,0.18837867180506387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,16,power_law_1.01,0.18610559701919555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,16,power_law_1.01,0.18706560134887695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,16,power_law_1.2,0.1844480037689209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,16,power_law_1.2,0.20349440574645997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,2,balanced,0.7750399907430013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,2,balanced,0.7752373218536377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,2,power_law_1.01,0.8343232154846192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,2,power_law_1.01,0.8755135536193848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,2,power_law_1.2,0.8877823829650879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,2,power_law_1.2,0.8929216384887695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,32,balanced,0.13607466220855713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,32,balanced,0.1376586655775706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,32,power_law_1.01,0.13295359611511232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,32,power_law_1.01,0.13653759956359862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,32,power_law_1.2,0.1435647964477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,32,power_law_1.2,0.1439743995666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,4,balanced,0.4434080123901367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,4,balanced,0.44413332144419354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,4,power_law_1.01,0.4498752117156982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,4,power_law_1.01,0.4633344173431396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,4,power_law_1.2,0.4609983921051025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,4,power_law_1.2,0.46883201599121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,64,balanced,0.11345066626866658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,64,balanced,0.11396267016728719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,64,power_law_1.01,0.1082751989364624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,64,power_law_1.01,0.11200640201568604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,64,power_law_1.2,0.11277439594268798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,64,power_law_1.2,0.1159168004989624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,8,balanced,0.3558559815088908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,8,balanced,0.3588053385416667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,8,power_law_1.01,0.3216576099395752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,8,power_law_1.01,0.3329279899597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,8,power_law_1.2,0.3445568084716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,1,8,power_law_1.2,0.3482752084732056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,16,1,balanced,0.31561599175135296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,16,1,balanced,0.3168479998906453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,16,1,power_law_1.01,0.3467200040817261
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,16,1,power_law_1.01,0.34882559776306155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,16,1,power_law_1.2,0.3515968084335327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,16,1,power_law_1.2,0.3516031980514526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,2,1,balanced,0.8888373374938965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,2,1,balanced,0.8970346450805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,2,1,power_law_1.01,1.0072192192077636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,2,1,power_law_1.01,1.0082880020141602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,2,1,power_law_1.2,1.0590720176696777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,2,1,power_law_1.2,1.0674752235412597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,32,1,balanced,0.2861280043919881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,32,1,balanced,0.2862933278083801
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,32,1,power_law_1.01,0.31076478958129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,32,1,power_law_1.01,0.31139841079711916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,32,1,power_law_1.2,0.3150079965591431
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,32,1,power_law_1.2,0.31515519618988036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,4,1,balanced,0.5414666732152303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,4,1,balanced,0.5429226557413737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,4,1,power_law_1.01,0.5954944133758545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,4,1,power_law_1.01,0.5988863945007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,4,1,power_law_1.2,0.6220352172851562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,4,1,power_law_1.2,0.625926399230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,8,1,balanced,0.37965333461761475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,8,1,balanced,0.3800160090128581
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,8,1,power_law_1.01,0.4155456066131592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,8,1,power_law_1.01,0.41646718978881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,8,1,power_law_1.2,0.4264832019805908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,1536,7168,2048,8,384,8,1,power_law_1.2,0.42970881462097166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,1,balanced,0.07818666597207387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,1,balanced,0.07828266421953838
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,1,power_law_1.01,0.053491199016571046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,1,power_law_1.01,0.05415679812431336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,1,power_law_1.2,0.052243202924728394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,1,power_law_1.2,0.053388798236846925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,128,balanced,0.02587733417749405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,128,balanced,0.02749866743882497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,128,power_law_1.01,0.025043201446533204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,128,power_law_1.01,0.026547199487686156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,128,power_law_1.2,0.02447360008955002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,128,power_law_1.2,0.025119999051094057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,16,balanced,0.027215999861558277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,16,balanced,0.027242665489514668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,16,power_law_1.01,0.024454399943351746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,16,power_law_1.01,0.02502399981021881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,16,power_law_1.2,0.02470400035381317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,16,power_law_1.2,0.02534399926662445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,2,balanced,0.05435733497142792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,2,balanced,0.055589333176612854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,2,power_law_1.01,0.038022398948669434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,2,power_law_1.01,0.03945600092411041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,2,power_law_1.2,0.038176000118255615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,2,power_law_1.2,0.03930880129337311
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,32,balanced,0.025648000339667004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,32,balanced,0.027301333844661713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,32,power_law_1.01,0.024223999679088594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,32,power_law_1.01,0.02459519952535629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,32,power_law_1.2,0.023206399381160737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,32,power_law_1.2,0.02388480007648468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,4,balanced,0.03324266771475474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,4,balanced,0.036602665980656944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,4,power_law_1.01,0.029926401376724244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,4,power_law_1.01,0.03115519881248474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,4,power_law_1.2,0.029190400242805482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,4,power_law_1.2,0.029900801181793214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,64,balanced,0.025472000241279602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,64,balanced,0.02749866743882497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,64,power_law_1.01,0.024454399943351746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,64,power_law_1.01,0.02568959891796112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,64,power_law_1.2,0.023756800591945647
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,64,power_law_1.2,0.023929600417613984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,8,balanced,0.02926933268706004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,8,balanced,0.029391999046007793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,8,power_law_1.01,0.025721600651741026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,8,power_law_1.01,0.0262719988822937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,8,power_law_1.2,0.027327999472618103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,1,8,power_law_1.2,0.027904000878334046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,2,1,balanced,0.05609600245952606
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,2,1,balanced,0.05704533557097117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,2,1,power_law_1.01,0.03847039937973022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,2,1,power_law_1.01,0.03885439932346344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,2,1,power_law_1.2,0.035622400045394895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,2,1,power_law_1.2,0.03694719970226288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,4,1,balanced,0.03766933331886927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,4,1,balanced,0.03880000114440918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,4,1,power_law_1.01,0.029580798745155335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,4,1,power_law_1.01,0.03030399978160858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,4,1,power_law_1.2,0.030003198981285097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,2048,768,8,128,4,1,power_law_1.2,0.03028480112552643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,1,balanced,0.16953066984812418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,1,balanced,0.17093332608540854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,1,power_law_1.01,0.13501440286636351
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,1,power_law_1.01,0.13672319650650025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,1,power_law_1.2,0.12163200378417968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,1,power_law_1.2,0.12462719678878784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,128,balanced,0.025349333882331848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,128,balanced,0.027295999228954315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,128,power_law_1.01,0.025337600708007814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,128,power_law_1.01,0.025676798820495606
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,128,power_law_1.2,0.02476159930229187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,128,power_law_1.2,0.025094398856163026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,16,balanced,0.03156266609827677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,16,balanced,0.03186666717131933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,16,power_law_1.01,0.04384639859199524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,16,power_law_1.01,0.046316799521446225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,16,power_law_1.2,0.0453247994184494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,16,power_law_1.2,0.047353601455688475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,2,balanced,0.10065066814422607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,2,balanced,0.10248532891273499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,2,power_law_1.01,0.09098880290985108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,2,power_law_1.01,0.09255679845809936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,2,power_law_1.2,0.07948799729347229
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,2,power_law_1.2,0.08561919927597046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,256,balanced,0.029306667546431225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,256,balanced,0.029365333418051403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,256,power_law_1.01,0.02654080092906952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,256,power_law_1.01,0.027046400308609008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,256,power_law_1.2,0.025920000672340394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,256,power_law_1.2,0.02656640112400055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,32,balanced,0.027493332823117573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,32,balanced,0.02926933268706004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,32,power_law_1.01,0.027929601073265076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,32,power_law_1.01,0.030476799607276915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,32,power_law_1.2,0.02887679934501648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,32,power_law_1.2,0.029824000597000123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,4,balanced,0.06634666522343953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,4,balanced,0.06648533542950948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,4,power_law_1.01,0.06878719925880432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,4,power_law_1.01,0.06970239877700805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,4,power_law_1.2,0.06244480013847351
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,4,power_law_1.2,0.066457599401474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,64,balanced,0.027221334477265675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,64,balanced,0.02754666656255722
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,64,power_law_1.01,0.025593599677085875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,64,power_law_1.01,0.02746880054473877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,64,power_law_1.2,0.026636800169944762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,64,power_law_1.2,0.02685439884662628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,8,balanced,0.04712533454100291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,8,balanced,0.048528000712394714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,8,power_law_1.01,0.05991680026054382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,8,power_law_1.01,0.060108798742294314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,8,power_law_1.2,0.055302399396896365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,1,8,power_law_1.2,0.05987840294837952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,2,1,balanced,0.10366933544476827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,2,1,balanced,0.10452266534169515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,2,1,power_law_1.01,0.08338559865951538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,2,1,power_law_1.01,0.08503680229187012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,2,1,power_law_1.2,0.07660160064697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,2,1,power_law_1.2,0.07796480059623719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,4,1,balanced,0.06931733091672261
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,4,1,balanced,0.0693333347638448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,4,1,power_law_1.01,0.05585920214653015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,4,1,power_law_1.01,0.058220797777175905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,4,1,power_law_1.2,0.05497599840164184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,4,1,power_law_1.2,0.05544319748878479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,8,1,balanced,0.05372266471385956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,8,1,balanced,0.0547626664241155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,8,1,power_law_1.01,0.04428800046443939
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,8,1,power_law_1.01,0.044409599900245664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,8,1,power_law_1.2,0.041247999668121337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,3072,1536,8,256,8,1,power_law_1.2,0.042854401469230655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,1,balanced,0.14019733667373657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,1,balanced,0.14056533575057983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,1,power_law_1.01,0.13959039449691774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,1,power_law_1.01,0.13960319757461548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,1,power_law_1.2,0.1349503993988037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,1,power_law_1.2,0.13733760118484498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,2,balanced,0.08472533027331035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,2,balanced,0.0860640009244283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,2,power_law_1.01,0.08243839740753174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,2,power_law_1.01,0.08372480273246766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,2,power_law_1.2,0.08668799996376038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,2,power_law_1.2,0.09095680117607116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,4,balanced,0.05956799785296122
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,4,balanced,0.060133333007494606
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,4,power_law_1.01,0.05978239774703979
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,4,power_law_1.01,0.0602944016456604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,4,power_law_1.2,0.058950400352478026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,4,power_law_1.2,0.060684800148010254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,8,balanced,0.04320000112056732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,8,balanced,0.04391466577847799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,8,power_law_1.01,0.04185599982738495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,8,power_law_1.01,0.04296959936618805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,8,power_law_1.2,0.04104959964752197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,1,8,power_law_1.2,0.04351359903812409
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,16,1,balanced,0.029472000896930695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,16,1,balanced,0.02956266701221466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,16,1,power_law_1.01,0.027603200078010558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,16,1,power_law_1.01,0.029407998919486998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,16,1,power_law_1.2,0.028364801406860353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,16,1,power_law_1.2,0.028575998544692994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,2,1,balanced,0.08477866649627686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,2,1,balanced,0.08610133330027263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,2,1,power_law_1.01,0.08133119940757752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,2,1,power_law_1.01,0.08358399868011475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,2,1,power_law_1.2,0.08217599987983704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,2,1,power_law_1.2,0.08513919711112976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,32,1,balanced,0.027029333015282948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,32,1,balanced,0.028549333413441975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,32,1,power_law_1.01,0.025465598702430724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,32,1,power_law_1.01,0.02730880081653595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,32,1,power_law_1.2,0.02730880081653595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,32,1,power_law_1.2,0.02768000066280365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,4,1,balanced,0.057999998331069946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,4,1,balanced,0.058186665177345276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,4,1,power_law_1.01,0.055289602279663085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,4,1,power_law_1.01,0.05596799850463867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,4,1,power_law_1.2,0.05592319965362549
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,4,1,power_law_1.2,0.05614079833030701
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,8,1,balanced,0.03788800040880839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,8,1,balanced,0.038202665746212006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,8,1,power_law_1.01,0.03837440013885498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,8,1,power_law_1.01,0.03887999951839447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,8,1,power_law_1.2,0.03688960075378418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,14336,2,8,8,1,power_law_1.2,0.03780480027198792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,1,balanced,0.2173866629600525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,1,balanced,0.21812800566355386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,1,power_law_1.01,0.1195520043373108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,1,power_law_1.01,0.12681599855422973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,1,power_law_1.2,0.11486719846725464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,1,power_law_1.2,0.11523200273513794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,128,balanced,0.029445332785447437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,128,balanced,0.031040000418821972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,128,power_law_1.01,0.028825598955154418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,128,power_law_1.01,0.02887679934501648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,128,power_law_1.2,0.02754560112953186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,128,power_law_1.2,0.028966400027275085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,16,balanced,0.0330079992612203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,16,balanced,0.03313066562016805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,16,power_law_1.01,0.030393600463867188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,16,power_law_1.01,0.031123200058937074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,16,power_law_1.2,0.03131519854068756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,16,power_law_1.2,0.031865599751472476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,2,balanced,0.12362133463223775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,2,balanced,0.12443733215332031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,2,power_law_1.01,0.07622399926185608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,2,power_law_1.01,0.08225280046463013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,2,power_law_1.2,0.08109440207481385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,2,power_law_1.2,0.08451840281486511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,32,balanced,0.029359998802344005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,32,balanced,0.02956799914439519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,32,power_law_1.01,0.027379199862480164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,32,power_law_1.01,0.02778240144252777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,32,power_law_1.2,0.0271807998418808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,32,power_law_1.2,0.02728320062160492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,4,balanced,0.07783466577529907
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,4,balanced,0.0783679982026418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,4,power_law_1.01,0.05937280058860779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,4,power_law_1.01,0.06309120059013366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,4,power_law_1.2,0.060083198547363284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,4,power_law_1.2,0.06222079992294312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,64,balanced,0.027349332968393963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,64,balanced,0.03018666555484136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,64,power_law_1.01,0.026719999313354493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,64,power_law_1.01,0.028748801350593566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,64,power_law_1.2,0.026662400364875792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,64,power_law_1.2,0.028646400570869444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,8,balanced,0.054560000697771706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,8,balanced,0.05593066910902659
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,8,power_law_1.01,0.04525440037250519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,8,power_law_1.01,0.046649599075317384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,8,power_law_1.2,0.03857280015945434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,1,8,power_law_1.2,0.050329601764678954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,2,1,balanced,0.1269973317782084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,2,1,balanced,0.12709866960843405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,2,1,power_law_1.01,0.0778432011604309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,2,1,power_law_1.01,0.08025599718093872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,2,1,power_law_1.2,0.0728384017944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,2,1,power_law_1.2,0.07287039756774902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,4,1,balanced,0.08055466910203297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,4,1,balanced,0.08237333099047343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,4,1,power_law_1.01,0.053990399837493895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,4,1,power_law_1.01,0.05538560152053833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,4,1,power_law_1.2,0.05287039875984192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,4,1,power_law_1.2,0.05454720258712768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,8,1,balanced,0.06097066899140676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,8,1,balanced,0.06252266466617584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,8,1,power_law_1.01,0.04320000112056732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,8,1,power_law_1.01,0.04321280121803284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,8,1,power_law_1.2,0.03952000141143799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,4096,1536,8,128,8,1,power_law_1.2,0.040300801396369934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,1,balanced,0.2193546692530314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,1,balanced,0.2208426594734192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,1,power_law_1.01,0.21835520267486572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,1,power_law_1.01,0.22330238819122314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,1,power_law_1.2,0.2214400053024292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,1,power_law_1.2,0.2273792028427124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,2,balanced,0.12786133090655008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,2,balanced,0.12904533743858337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,2,power_law_1.01,0.12911360263824462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,2,power_law_1.01,0.13448959589004517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,2,power_law_1.2,0.1283903956413269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,2,power_law_1.2,0.1384768009185791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,4,balanced,0.078015998005867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,4,balanced,0.07884266475836436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,4,power_law_1.01,0.0833407998085022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,4,power_law_1.01,0.08491520285606384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,4,power_law_1.2,0.08181120157241821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,4,power_law_1.2,0.08353919982910156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,8,balanced,0.056287998954455055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,8,balanced,0.05778666834036509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,8,power_law_1.01,0.0541055977344513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,8,power_law_1.01,0.0546176016330719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,8,power_law_1.2,0.0545087993144989
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,1,8,power_law_1.2,0.05564799904823303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,16,1,balanced,0.033285332222779594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,16,1,balanced,0.03357866654793421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,16,1,power_law_1.01,0.032332798838615416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,16,1,power_law_1.01,0.03247359991073608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,16,1,power_law_1.2,0.032332798838615416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,16,1,power_law_1.2,0.03281919956207276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,2,1,balanced,0.12430399656295776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,2,1,balanced,0.12667733430862427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,2,1,power_law_1.01,0.12307840585708618
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,2,1,power_law_1.01,0.12406400442123414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,2,1,power_law_1.2,0.11992319822311401
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,2,1,power_law_1.2,0.12496639490127563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,32,1,balanced,0.029130667448043823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,32,1,balanced,0.02974933385848999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,32,1,power_law_1.01,0.027558401226997375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,32,1,power_law_1.01,0.028166401386260986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,32,1,power_law_1.2,0.027263998985290527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,32,1,power_law_1.2,0.027993598580360414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,4,1,balanced,0.0782773345708847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,4,1,balanced,0.07885333398977916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,4,1,power_law_1.01,0.07524480223655701
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,4,1,power_law_1.01,0.07674239873886109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,4,1,power_law_1.2,0.07580159902572632
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,4,1,power_law_1.2,0.07667840123176575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,8,1,balanced,0.05231466889381409
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,8,1,balanced,0.053898667295773826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,8,1,power_law_1.01,0.051571202278137204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,8,1,power_law_1.01,0.051635199785232545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,8,1,power_law_1.2,0.051583999395370485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,16384,2,8,8,1,power_law_1.2,0.05238400101661682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,1,balanced,0.3993706703186035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,1,balanced,0.400762677192688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,1,power_law_1.01,0.30405759811401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,1,power_law_1.01,0.31503360271453856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,1,power_law_1.2,0.27251200675964354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,1,power_law_1.2,0.2731519937515259
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,128,balanced,0.03149333347876867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,128,balanced,0.031530665854612984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,128,power_law_1.01,0.030681601166725157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,128,power_law_1.01,0.032364800572395325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,128,power_law_1.2,0.030067199468612672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,128,power_law_1.2,0.03018240034580231
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,16,balanced,0.05505600074927012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,16,balanced,0.055306668082873024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,16,power_law_1.01,0.07524480223655701
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,16,power_law_1.01,0.07637119889259339
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,16,power_law_1.2,0.07456640005111695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,16,power_law_1.2,0.0763584017753601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,2,balanced,0.21613333622614542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,2,balanced,0.21718400716781616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,2,power_law_1.01,0.18683520555496216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,2,power_law_1.01,0.1982975959777832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,2,power_law_1.2,0.17229440212249755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,2,power_law_1.2,0.1804095983505249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,256,balanced,0.029493334392706554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,256,balanced,0.03148266673088074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,256,power_law_1.01,0.029996800422668456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,256,power_law_1.01,0.03107840120792389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,256,power_law_1.2,0.029120001196861266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,256,power_law_1.2,0.02919679880142212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,32,balanced,0.033488000432650246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,32,balanced,0.034661332766215004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,32,power_law_1.01,0.050988799333572386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,32,power_law_1.01,0.053260797262191774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,32,power_law_1.2,0.04810880124568939
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,32,power_law_1.2,0.04943360090255737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,4,balanced,0.12386133273442586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,4,balanced,0.12492266297340393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,4,power_law_1.01,0.13448959589004517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,4,power_law_1.01,0.1370687961578369
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,4,power_law_1.2,0.12250239849090576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,4,power_law_1.2,0.12567039728164672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,64,balanced,0.03141333411137263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,64,balanced,0.03163733333349228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,64,power_law_1.01,0.031020799279212953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,64,power_law_1.01,0.03245440125465393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,64,power_law_1.2,0.03157120048999786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,64,power_law_1.2,0.032307198643684386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,8,balanced,0.07825600107510884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,8,balanced,0.07864533364772797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,8,power_law_1.01,0.09842560291290284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,8,power_law_1.01,0.10364799499511719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,8,power_law_1.2,0.11157759428024291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,1,8,power_law_1.2,0.11222399473190307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,16,1,balanced,0.06740266581376393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,16,1,balanced,0.06799466907978058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,16,1,power_law_1.01,0.05734400153160095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,16,1,power_law_1.01,0.05809280276298523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,16,1,power_law_1.2,0.05420799851417542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,16,1,power_law_1.2,0.05496960282325745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,2,1,balanced,0.21782400210698447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,2,1,balanced,0.21819200118382773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,2,1,power_law_1.01,0.1668544054031372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,2,1,power_law_1.01,0.17285120487213135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,2,1,power_law_1.2,0.155840003490448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,2,1,power_law_1.2,0.15640319585800172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,32,1,balanced,0.05120533208052317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,32,1,balanced,0.05249600112438202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,32,1,power_law_1.01,0.04407039880752563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,32,1,power_law_1.01,0.04611839950084686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,32,1,power_law_1.2,0.042316800355911253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,32,1,power_law_1.2,0.043584001064300534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,4,1,balanced,0.12781866391499838
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,4,1,balanced,0.12796266873677573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,4,1,power_law_1.01,0.10224640369415283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,4,1,power_law_1.01,0.10421760082244873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,4,1,power_law_1.2,0.09188479781150818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,4,1,power_law_1.2,0.09267200231552124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,8,1,balanced,0.08518399794896443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,8,1,balanced,0.08519466718037923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,8,1,power_law_1.01,0.06884480118751526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,8,1,power_law_1.01,0.06974080204963684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,8,1,power_law_1.2,0.06536319851875305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2048,8,256,8,1,power_law_1.2,0.0668287992477417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,1,balanced,0.4901813268661499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,1,balanced,0.4922026793162028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,1,power_law_1.01,0.3019711971282959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,1,power_law_1.01,0.3068671941757202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,1,power_law_1.2,0.2745408058166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,1,power_law_1.2,0.2745984077453613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,16,balanced,0.06028800209363302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,16,balanced,0.06149866680304209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,16,power_law_1.01,0.05080320239067078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,16,power_law_1.01,0.06178560256958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,16,power_law_1.2,0.05251200199127197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,16,power_law_1.2,0.05348479747772217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,2,balanced,0.2630400061607361
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,2,balanced,0.2635786732037862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,2,power_law_1.01,0.17255680561065673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,2,power_law_1.01,0.18876800537109376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,2,power_law_1.2,0.1726207971572876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,2,power_law_1.2,0.17631360292434692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,32,balanced,0.04445866743723551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,32,balanced,0.0452106644709905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,32,power_law_1.01,0.03825919926166534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,32,power_law_1.01,0.04622719883918762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,32,power_law_1.2,0.04040960073471069
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,32,power_law_1.2,0.040608000755310056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,4,balanced,0.14684800306955972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,4,balanced,0.14756266276041666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,4,power_law_1.01,0.11457279920578003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,4,power_law_1.01,0.12896000146865844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,4,power_law_1.2,0.12110719680786133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,4,power_law_1.2,0.12225919961929321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,8,balanced,0.09079466263453166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,8,balanced,0.09085866808891296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,8,power_law_1.01,0.09039999842643738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,8,power_law_1.01,0.09219840168952942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,8,power_law_1.2,0.08391680121421814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,1,8,power_law_1.2,0.08789759874343872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,2,1,balanced,0.263045330842336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,2,1,balanced,0.2640480001767476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,2,1,power_law_1.01,0.16558079719543456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,2,1,power_law_1.01,0.16915839910507202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,2,1,power_law_1.2,0.14894720315933227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,2,1,power_law_1.2,0.15368319749832154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,4,1,balanced,0.1551146705945333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,4,1,balanced,0.15537066260973612
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,4,1,power_law_1.01,0.10327039957046509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,4,1,power_law_1.01,0.10409599542617798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,4,1,power_law_1.2,0.09389439821243287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,4,1,power_law_1.2,0.09905920028686524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,8,1,balanced,0.09575999776522319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,8,1,balanced,0.09679466485977173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,8,1,power_law_1.01,0.06775680184364319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,8,1,power_law_1.01,0.0685375988483429
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,8,1,power_law_1.2,0.06591359972953796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,6144,2560,8,160,8,1,power_law_1.2,0.06602879762649536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,1,balanced,0.461514671643575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,1,balanced,0.4624106486638387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,1,power_law_1.01,0.35365118980407717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,1,power_law_1.01,0.361625599861145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,1,power_law_1.2,0.31833600997924805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,1,power_law_1.2,0.32055680751800536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,128,balanced,0.033376000821590424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,128,balanced,0.03356799980004629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,128,power_law_1.01,0.03113600015640259
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,128,power_law_1.01,0.032492798566818235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,128,power_law_1.2,0.0315200001001358
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,128,power_law_1.2,0.03288959860801697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,16,balanced,0.05841066439946493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,16,balanced,0.058506667613983154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,16,power_law_1.01,0.07530879974365234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,16,power_law_1.01,0.08406400084495544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,16,power_law_1.2,0.08387839794158936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,16,power_law_1.2,0.08413439989089966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,2,balanced,0.2474986712137858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,2,balanced,0.24762133757273355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,2,power_law_1.01,0.21278719902038573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,2,power_law_1.01,0.22351999282836915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,2,power_law_1.2,0.19288320541381837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,2,power_law_1.2,0.1982143998146057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,256,balanced,0.031530665854612984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,256,balanced,0.031685332457224526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,256,power_law_1.01,0.029900801181793214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,256,power_law_1.01,0.031999999284744264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,256,power_law_1.2,0.030880001187324525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,256,power_law_1.2,0.03193599879741669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,32,balanced,0.03730133424202601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,32,balanced,0.041434665520985924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,32,power_law_1.01,0.055212801694869994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,32,power_law_1.01,0.05605760216712952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,32,power_law_1.2,0.04943360090255737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,32,power_law_1.2,0.05464320182800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,4,balanced,0.14034666617711386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,4,balanced,0.14070933063824972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,4,power_law_1.01,0.14395519495010375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,4,power_law_1.01,0.15731199979782104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,4,power_law_1.2,0.12375040054321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,4,power_law_1.2,0.1533568024635315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,64,balanced,0.03287466615438461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,64,balanced,0.03366400053103765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,64,power_law_1.01,0.03518719971179962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,64,power_law_1.01,0.03702400028705597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,64,power_law_1.2,0.03402880132198334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,64,power_law_1.2,0.034815999865531924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,8,balanced,0.08678932984670003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,8,balanced,0.0869706670443217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,8,power_law_1.01,0.10553599596023559
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,8,power_law_1.01,0.11429120302200317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,8,power_law_1.2,0.10759040117263793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,1,8,power_law_1.2,0.12568960189819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,16,1,balanced,0.07342933118343353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,16,1,balanced,0.07448533177375793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,16,1,power_law_1.01,0.06224640011787415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,16,1,power_law_1.01,0.06225280165672302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,16,1,power_law_1.2,0.058387202024459836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,16,1,power_law_1.2,0.06033279895782471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,2,1,balanced,0.24758932987848917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,2,1,balanced,0.24854934215545654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,2,1,power_law_1.01,0.19118080139160157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,2,1,power_law_1.01,0.19345279932022094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,2,1,power_law_1.2,0.17786879539489747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,2,1,power_law_1.2,0.17957119941711425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,32,1,balanced,0.05809600154558817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,32,1,balanced,0.05991466840108236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,32,1,power_law_1.01,0.05007359981536865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,32,1,power_law_1.01,0.05095679759979248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,32,1,power_law_1.2,0.045977601408958436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,32,1,power_law_1.2,0.046751999855041505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,4,1,balanced,0.14220266540845236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,4,1,balanced,0.14243200421333313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,4,1,power_law_1.01,0.11340160369873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,4,1,power_law_1.01,0.11603840589523315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,4,1,power_law_1.2,0.10243200063705445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,4,1,power_law_1.2,0.1047551989555359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,8,1,balanced,0.09347732861836751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,8,1,balanced,0.09483733773231506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,8,1,power_law_1.01,0.07699840068817139
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,8,1,power_law_1.01,0.07816320061683654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,8,1,power_law_1.2,0.07274240255355835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,256,8,1,power_law_1.2,0.07326719760894776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,1,balanced,0.4620906511942546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,1,balanced,0.4625493288040161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,1,power_law_1.01,0.4143104076385498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,1,power_law_1.01,0.4147071838378906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,1,power_law_1.2,0.37798399925231935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,1,power_law_1.2,0.3789184093475342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,128,balanced,0.033413333197434746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,128,balanced,0.03356799980004629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,128,power_law_1.01,0.033228799700737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,128,power_law_1.01,0.03472639918327332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,128,power_law_1.2,0.03247359991073608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,128,power_law_1.2,0.03365119993686676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,16,balanced,0.059290667374928795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,16,balanced,0.059434667229652405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,16,power_law_1.01,0.11055999994277954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,16,power_law_1.01,0.11088000535964966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,16,power_law_1.2,0.10843520164489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,16,power_law_1.2,0.11110399961471558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,2,balanced,0.2475093404452006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,2,balanced,0.24764800071716309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,2,power_law_1.01,0.26968960762023925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,2,power_law_1.01,0.2757951974868774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,2,power_law_1.2,0.239737606048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,2,power_law_1.2,0.24753921031951903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,32,balanced,0.038405333956082664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,32,balanced,0.039701332648595176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,32,power_law_1.01,0.06951680183410644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,32,power_law_1.01,0.07110400199890136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,32,power_law_1.2,0.06883199810981751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,32,power_law_1.2,0.07087360024452209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,4,balanced,0.13877333203951517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,4,balanced,0.14146133263905844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,4,power_law_1.01,0.18803199529647827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,4,power_law_1.01,0.19837440252304078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,4,power_law_1.2,0.17940479516983032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,4,power_law_1.2,0.18467199802398682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,64,balanced,0.03173333406448364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,64,balanced,0.033589333295822144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,64,power_law_1.01,0.04962559938430786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,64,power_law_1.01,0.05195519924163818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,64,power_law_1.2,0.04581120014190674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,64,power_law_1.2,0.05159040093421936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,8,balanced,0.08703999718030293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,8,balanced,0.08728532989819844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,8,power_law_1.01,0.14835200309753419
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,8,power_law_1.01,0.15461119413375854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,8,power_law_1.2,0.14052480459213257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,1,8,power_law_1.2,0.1506943941116333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,16,1,balanced,0.07371733089288075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,16,1,balanced,0.0747680018345515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,16,1,power_law_1.01,0.0673792004585266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,16,1,power_law_1.01,0.06782079935073852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,16,1,power_law_1.2,0.06524800062179566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,16,1,power_law_1.2,0.06570879817008972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,2,1,balanced,0.2494986653327942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,2,1,balanced,0.24958932399749756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,2,1,power_law_1.01,0.22128000259399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,2,1,power_law_1.01,0.23231360912322999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,2,1,power_law_1.2,0.20647039413452148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,2,1,power_law_1.2,0.20692479610443115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,32,1,balanced,0.05945600072542826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,32,1,balanced,0.06001066664854685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,32,1,power_law_1.01,0.05482239723205566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,32,1,power_law_1.01,0.05511680245399475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,32,1,power_law_1.2,0.05314559936523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,32,1,power_law_1.2,0.0531711995601654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,4,1,balanced,0.14282666643460593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,4,1,balanced,0.14312000075976053
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,4,1,power_law_1.01,0.12810879945755005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,4,1,power_law_1.01,0.131494402885437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,4,1,power_law_1.2,0.12129919528961182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,4,1,power_law_1.2,0.1217919945716858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,8,1,balanced,0.09329066673914592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,8,1,balanced,0.09405866265296936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,8,1,power_law_1.01,0.08492799997329711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,8,1,power_law_1.01,0.08515840172767639
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,8,1,power_law_1.2,0.08051199913024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16,7168,2048,8,384,8,1,power_law_1.2,0.0805184006690979
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,1,balanced,0.09597866733868916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,1,balanced,0.09641066193580627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,1,power_law_1.01,0.08951039910316468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,1,power_law_1.01,0.09023360013961793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,1,power_law_1.2,0.09088640213012696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,1,power_law_1.2,0.09099519848823548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,128,balanced,0.03630933413902918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,128,balanced,0.037733333806196846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,128,power_law_1.01,0.03493120074272156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,128,power_law_1.01,0.035257598757743834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,128,power_law_1.2,0.03449600040912628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,128,power_law_1.2,0.035123199224472046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,16,balanced,0.0539626677831014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,16,balanced,0.054154664278030396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,16,power_law_1.01,0.048076799511909483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,16,power_law_1.01,0.04822399914264679
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,16,power_law_1.2,0.046438398957252505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,16,power_law_1.2,0.04747520089149475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,2,balanced,0.05879466732343038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,2,balanced,0.05910933514436086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,2,power_law_1.01,0.05725439786911011
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,2,power_law_1.01,0.058348798751831056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,2,power_law_1.2,0.058739197254180905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,2,power_law_1.2,0.05935360193252563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,32,balanced,0.04576000074545542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,32,balanced,0.0458186666170756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,32,power_law_1.01,0.04095360040664673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,32,power_law_1.01,0.04149760007858276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,32,power_law_1.2,0.03882879912853241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,32,power_law_1.2,0.03909119963645935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,4,balanced,0.041562666495641075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,4,balanced,0.04381866753101349
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,4,power_law_1.01,0.04199680089950562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,4,power_law_1.01,0.042752000689506534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,4,power_law_1.2,0.040908798575401306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,4,power_law_1.2,0.041356799006462094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,64,balanced,0.039701332648595176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,64,balanced,0.03992533435424169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,64,power_law_1.01,0.03656319975852966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,64,power_law_1.01,0.03764480054378509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,64,power_law_1.2,0.03532159924507141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,64,power_law_1.2,0.036473599076271054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,8,balanced,0.0439573327700297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,8,balanced,0.04557866851488749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,8,power_law_1.01,0.03871999979019165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,8,power_law_1.01,0.039027199149131775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,8,power_law_1.2,0.0379967987537384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,1,8,power_law_1.2,0.03914879858493805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,2,1,balanced,0.06817066669464111
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,2,1,balanced,0.06905599931875865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,2,1,power_law_1.01,0.06382719874382019
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,2,1,power_law_1.01,0.06424959897994995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,2,1,power_law_1.2,0.06407039761543273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,2,1,power_law_1.2,0.06506239771842956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,4,1,balanced,0.05481599768002828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,4,1,balanced,0.05606399973233541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,4,1,power_law_1.01,0.049721598625183105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,4,1,power_law_1.01,0.051974397897720334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,4,1,power_law_1.2,0.05139840245246887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,2048,768,8,128,4,1,power_law_1.2,0.05199360251426697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,1,balanced,0.3179093400637309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,1,balanced,0.31828800837198895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,1,power_law_1.01,0.27082879543304444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,1,power_law_1.01,0.2721407890319824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,1,power_law_1.2,0.27489280700683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,1,power_law_1.2,0.28314239978790284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,128,balanced,0.03965866565704346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,128,balanced,0.03976000100374222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,128,power_law_1.01,0.039628800749778745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,128,power_law_1.01,0.04043520092964172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,128,power_law_1.2,0.03783040046691895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,128,power_law_1.2,0.03901439905166626
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,16,balanced,0.07817600170771281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,16,balanced,0.0787360022465388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,16,power_law_1.01,0.06639999747276307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,16,power_law_1.01,0.06842880249023438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,16,power_law_1.2,0.06429439783096313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,16,power_law_1.2,0.06584320068359376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,2,balanced,0.17684799432754517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,2,balanced,0.178165336449941
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,2,power_law_1.01,0.14890880584716798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,2,power_law_1.01,0.15639040470123292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,2,power_law_1.2,0.15693440437316894
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,2,power_law_1.2,0.1597759962081909
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,256,balanced,0.03984000037113825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,256,balanced,0.03993066648642222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,256,power_law_1.01,0.03760640025138855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,256,power_law_1.01,0.03772799968719483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,256,power_law_1.2,0.03697920143604279
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,256,power_law_1.2,0.03699199855327606
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,32,balanced,0.09132267038027446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,32,balanced,0.10569600264231364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,32,power_law_1.01,0.08127999901771546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,32,power_law_1.01,0.08293759822845459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,32,power_law_1.2,0.07647359967231751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,32,power_law_1.2,0.08455039858818054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,4,balanced,0.10539199908574422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,4,balanced,0.1071626643339793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,4,power_law_1.01,0.09592959880828858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,4,power_law_1.01,0.09928960204124451
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,4,power_law_1.2,0.0943615972995758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,4,power_law_1.2,0.0950655996799469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,64,balanced,0.0563679983218511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,64,balanced,0.056549335519472756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,64,power_law_1.01,0.05129600167274475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,64,power_law_1.01,0.05420799851417542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,64,power_law_1.2,0.05192959904670715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,64,power_law_1.2,0.052275198698043826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,8,balanced,0.07242133220036824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,8,balanced,0.07270933190981548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,8,power_law_1.01,0.06511359810829162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,8,power_law_1.01,0.0654591977596283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,8,power_law_1.2,0.06398720145225525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,1,8,power_law_1.2,0.06603519916534424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,2,1,balanced,0.1800373395284017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,2,1,balanced,0.18054399887720743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,2,1,power_law_1.01,0.15801600217819214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,2,1,power_law_1.01,0.15884159803390502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,2,1,power_law_1.2,0.16157439947128296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,2,1,power_law_1.2,0.16352640390396117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,4,1,balanced,0.1150986651579539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,4,1,balanced,0.11584533254305522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,4,1,power_law_1.01,0.10334080457687378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,4,1,power_law_1.01,0.10584319829940796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,4,1,power_law_1.2,0.10506880283355713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,4,1,power_law_1.2,0.10674560070037842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,8,1,balanced,0.08452266454696655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,8,1,balanced,0.08562133709589641
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,8,1,power_law_1.01,0.08119040131568908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,8,1,power_law_1.01,0.08138239979743958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,8,1,power_law_1.2,0.08121600151062011
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,3072,1536,8,256,8,1,power_law_1.2,0.0828607976436615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,1,balanced,0.19554666678110758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,1,balanced,0.195850670337677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,1,power_law_1.01,0.1921023964881897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,1,power_law_1.01,0.19304959774017333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,1,power_law_1.2,0.190937602519989
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,1,power_law_1.2,0.19377919435501098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,2,balanced,0.11913067102432251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,2,balanced,0.12057600418726604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,2,power_law_1.01,0.11571840047836304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,2,power_law_1.01,0.13619199991226197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,2,power_law_1.2,0.1301695942878723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,2,power_law_1.2,0.13797119855880738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,4,balanced,0.2225173314412435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,4,balanced,0.22566932439804077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,4,power_law_1.01,0.12286720275878907
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,4,power_law_1.01,0.1520640015602112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,4,power_law_1.2,0.10150400400161744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,4,power_law_1.2,0.22244479656219482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,8,balanced,0.14331733187039694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,8,balanced,0.15839999914169312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,8,power_law_1.01,0.10756479501724243
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,8,power_law_1.01,0.1428928017616272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,8,power_law_1.2,0.10024319887161255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,1,8,power_law_1.2,0.10537600517272949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,16,1,balanced,0.03975466638803482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,16,1,balanced,0.03984000037113825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,16,1,power_law_1.01,0.03858560025691986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,16,1,power_law_1.01,0.03906559944152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,16,1,power_law_1.2,0.038022398948669434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,16,1,power_law_1.2,0.03909119963645935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,2,1,balanced,0.10905599594116211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,2,1,balanced,0.10966400305430095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,2,1,power_law_1.01,0.10967040061950684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,2,1,power_law_1.01,0.11140480041503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,2,1,power_law_1.2,0.10753920078277587
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,2,1,power_law_1.2,0.11057920455932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,32,1,balanced,0.035530666510264076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,32,1,balanced,0.03561066587766012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,32,1,power_law_1.01,0.03372800052165985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,32,1,power_law_1.01,0.03390080034732819
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,32,1,power_law_1.2,0.03351039886474609
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,32,1,power_law_1.2,0.03369599878787995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,4,1,balanced,0.07247466842333476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,4,1,balanced,0.0734506646792094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,4,1,power_law_1.01,0.0697920024394989
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,4,1,power_law_1.01,0.07044479846954346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,4,1,power_law_1.2,0.06889600157737732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,4,1,power_law_1.2,0.07071999907493591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,8,1,balanced,0.05491200089454651
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,8,1,balanced,0.05592533449331919
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,8,1,power_law_1.01,0.05116159915924072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,8,1,power_law_1.01,0.051641601324081424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,8,1,power_law_1.2,0.05170559883117676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,14336,2,8,8,1,power_law_1.2,0.05240960121154785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,1,balanced,0.2571733395258586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,1,balanced,0.25780800978342694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,1,power_law_1.01,0.24622080326080323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,1,power_law_1.01,0.25014400482177734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,1,power_law_1.2,0.24895999431610108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,1,power_law_1.2,0.2516479969024658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,128,balanced,0.04158399999141693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,128,balanced,0.04165333261092504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,128,power_law_1.01,0.03971840143203735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,128,power_law_1.01,0.03975679874420166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,128,power_law_1.2,0.03925760090351105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,128,power_law_1.2,0.04009599983692169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,16,balanced,0.1092639962832133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,16,balanced,0.1160533328851064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,16,power_law_1.01,0.0923583984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,16,power_law_1.01,0.10400639772415161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,16,power_law_1.2,0.09684479832649232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,16,power_law_1.2,0.10006400346755981
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,2,balanced,0.13289599617322287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,2,balanced,0.13461333513259888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,2,power_law_1.01,0.13107839822769166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,2,power_law_1.01,0.1327296018600464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,2,power_law_1.2,0.13022719621658324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,2,power_law_1.2,0.13277440071105956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,32,balanced,0.056048000852266945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,32,balanced,0.05625066657861074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,32,power_law_1.01,0.050316798686981204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,32,power_law_1.01,0.050400000810623166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,32,power_law_1.2,0.047219198942184445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,32,power_law_1.2,0.04837760031223297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,4,balanced,0.0865226686000824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,4,balanced,0.08824533224105835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,4,power_law_1.01,0.082259202003479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,4,power_law_1.01,0.08558080196380616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,4,power_law_1.2,0.0862335979938507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,4,power_law_1.2,0.08673279881477355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,64,balanced,0.04181333382924398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,64,balanced,0.04322133461634318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,64,power_law_1.01,0.039417600631713866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,64,power_law_1.01,0.040089601278305055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,64,power_law_1.2,0.03984000086784363
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,64,power_law_1.2,0.03986560106277466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,8,balanced,0.08474133412043254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,8,balanced,0.0848640004793803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,8,power_law_1.01,0.07176960110664368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,8,power_law_1.01,0.07335039973258972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,8,power_law_1.2,0.06753280162811279
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,1,8,power_law_1.2,0.06889600157737732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,2,1,balanced,0.1625920037428538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,2,1,balanced,0.16499732931454977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,2,1,power_law_1.01,0.14752639532089235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,2,1,power_law_1.01,0.15077120065689087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,2,1,power_law_1.2,0.15338239669799805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,2,1,power_law_1.2,0.15464320182800292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,4,1,balanced,0.10689066847165425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,4,1,balanced,0.10693867007891338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,4,1,power_law_1.01,0.09710080027580262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,4,1,power_law_1.01,0.09813119769096375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,4,1,power_law_1.2,0.09670400023460388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,4,1,power_law_1.2,0.09816319942474365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,8,1,balanced,0.08413333694140117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,8,1,balanced,0.08521599570910136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,8,1,power_law_1.01,0.0775168001651764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,8,1,power_law_1.01,0.07758079767227173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,8,1,power_law_1.2,0.07790719866752624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,4096,1536,8,128,8,1,power_law_1.2,0.07800319790840149
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,1,balanced,0.38206934928894043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,1,balanced,0.38397332032521564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,1,power_law_1.01,0.3501823902130127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,1,power_law_1.01,0.3568063974380493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,1,power_law_1.2,0.33680000305175783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,1,power_law_1.2,0.34443519115447996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,2,balanced,0.16527466972668967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,2,balanced,0.1683466633160909
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,2,power_law_1.01,0.17579519748687744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,2,power_law_1.01,0.18725119829177855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,2,power_law_1.2,0.1784000039100647
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,2,power_law_1.2,0.18234239816665648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,4,balanced,0.2709226608276367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,4,balanced,0.28549333413441974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,4,power_law_1.01,0.17748479843139647
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,4,power_law_1.01,0.1928063988685608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,4,power_law_1.2,0.17635200023651124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,4,power_law_1.2,0.1864192008972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,8,balanced,0.1690453290939331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,8,balanced,0.17538134256998697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,8,power_law_1.01,0.16469759941101075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,8,power_law_1.01,0.17618559598922728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,8,power_law_1.2,0.10027519464492798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,1,8,power_law_1.2,0.16651519536972045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,16,1,balanced,0.051856001218159996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,16,1,balanced,0.05188799897829691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,16,1,power_law_1.01,0.04966399967670441
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,16,1,power_law_1.01,0.05008000135421753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,16,1,power_law_1.2,0.048582398891448976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,16,1,power_law_1.2,0.0500544011592865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,2,1,balanced,0.15744533141454062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,2,1,balanced,0.15868266423543295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,2,1,power_law_1.01,0.15991040468215942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,2,1,power_law_1.01,0.16170239448547363
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,2,1,power_law_1.2,0.1633344054222107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,2,1,power_law_1.2,0.163481605052948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,32,1,balanced,0.03941866755485535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,32,1,balanced,0.03988266736268997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,32,1,power_law_1.01,0.03687680065631867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,32,1,power_law_1.01,0.03752320110797882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,32,1,power_law_1.2,0.036550399661064145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,32,1,power_law_1.2,0.037248000502586365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,4,1,balanced,0.0988213320573171
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,4,1,balanced,0.09924266735712688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,4,1,power_law_1.01,0.09879680275917054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,4,1,power_law_1.01,0.09979519844055176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,4,1,power_law_1.2,0.09631999731063842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,4,1,power_law_1.2,0.09855999946594238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,8,1,balanced,0.06871466835339864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,8,1,balanced,0.0702453354994456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,8,1,power_law_1.01,0.06775680184364319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,8,1,power_law_1.01,0.06839039921760559
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,8,1,power_law_1.2,0.06678400039672852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,16384,2,8,8,1,power_law_1.2,0.06810879707336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,1,balanced,0.7871039708455404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,1,balanced,0.7897013028462728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,1,power_law_1.01,0.6760704040527343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,1,power_law_1.01,0.6806655883789062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,1,power_law_1.2,0.682041597366333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,1,power_law_1.2,0.7014400005340576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,128,balanced,0.050010666251182556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,128,balanced,0.05004266897837321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,128,power_law_1.01,0.046726399660110475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,128,power_law_1.01,0.04812160134315491
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,128,power_law_1.2,0.04593279957771301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,128,power_law_1.2,0.0480320006608963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,16,balanced,0.12495467066764832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,16,balanced,0.12573333581288657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,16,power_law_1.01,0.10046080350875855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,16,power_law_1.01,0.10907520055770874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,16,power_law_1.2,0.10570240020751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,16,power_law_1.2,0.10808320045471191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,2,balanced,0.4127253293991089
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,2,balanced,0.41344531377156574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,2,power_law_1.01,0.35427839756011964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,2,power_law_1.01,0.36745600700378417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,2,power_law_1.2,0.36221439838409425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,2,power_law_1.2,0.36868479251861574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,256,balanced,0.043680002291997276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,256,balanced,0.04386133452256521
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,256,power_law_1.01,0.042956799268722534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,256,power_law_1.01,0.04376319944858551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,256,power_law_1.2,0.04259200096130371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,256,power_law_1.2,0.042803201079368594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,32,balanced,0.18733867009480795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,32,balanced,0.19242133696873984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,32,power_law_1.01,0.15567359924316407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,32,power_law_1.01,0.17935999631881713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,32,power_law_1.2,0.160863995552063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,32,power_law_1.2,0.1770815968513489
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,4,balanced,0.22521599133809408
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,4,balanced,0.2278133432070414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,4,power_law_1.01,0.1997056007385254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,4,power_law_1.01,0.21073920726776124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,4,power_law_1.2,0.21009280681610107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,4,power_law_1.2,0.21023359298706054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,64,balanced,0.09723200400670369
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,64,balanced,0.10131733616193135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,64,power_law_1.01,0.08711680173873901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,64,power_law_1.01,0.08823040127754211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,64,power_law_1.2,0.08858879804611205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,64,power_law_1.2,0.09009280204772949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,8,balanced,0.13591999808947244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,8,balanced,0.13658666610717773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,8,power_law_1.01,0.11970560550689698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,8,power_law_1.01,0.127839994430542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,8,power_law_1.2,0.12019200325012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,1,8,power_law_1.2,0.12130559682846069
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,16,1,balanced,0.11412266890207927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,16,1,balanced,0.1153706709543864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,16,1,power_law_1.01,0.11038719415664673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,16,1,power_law_1.01,0.11179519891738891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,16,1,power_law_1.2,0.11235200166702271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,16,1,power_law_1.2,0.1145408034324646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,2,1,balanced,0.41276268164316815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,2,1,balanced,0.41437331835428876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,2,1,power_law_1.01,0.3564095973968506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,2,1,power_law_1.01,0.35797119140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,2,1,power_law_1.2,0.36205439567565917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,2,1,power_law_1.2,0.365011191368103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,32,1,balanced,0.09684266646703084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,32,1,balanced,0.09685867031415303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,32,1,power_law_1.01,0.09712640047073365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,32,1,power_law_1.01,0.09780480265617371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,32,1,power_law_1.2,0.09937919974327088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,32,1,power_law_1.2,0.10014079809188843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,4,1,balanced,0.2323360045750936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,4,1,balanced,0.23302932580312094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,4,1,power_law_1.01,0.20616319179534912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,4,1,power_law_1.01,0.20807039737701416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,4,1,power_law_1.2,0.2068095922470093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,4,1,power_law_1.2,0.20707199573516846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,8,1,balanced,0.1483573317527771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,8,1,balanced,0.14910399913787842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,8,1,power_law_1.01,0.13935999870300292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,8,1,power_law_1.01,0.13978240489959717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,8,1,power_law_1.2,0.14083839654922486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2048,8,256,8,1,power_law_1.2,0.14110080003738404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,1,balanced,0.6254453261693319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,1,balanced,0.6260480086008707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,1,power_law_1.01,0.6310912132263183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,1,power_law_1.01,0.6391295909881591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,1,power_law_1.2,0.6475200176239013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,1,power_law_1.2,0.6705152034759522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,16,balanced,0.09715200463930766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,16,balanced,0.09833600123723348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,16,power_law_1.01,0.08396160006523132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,16,power_law_1.01,0.08522239923477173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,16,power_law_1.2,0.07868160009384155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,16,power_law_1.2,0.08247039914131164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,2,balanced,0.3323360085487366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,2,balanced,0.3335253397623698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,2,power_law_1.01,0.33827838897705076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,2,power_law_1.01,0.3430847883224487
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,2,power_law_1.2,0.35368320941925047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,2,power_law_1.2,0.3569216012954712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,32,balanced,0.16269866625467935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,32,balanced,0.16755199432373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,32,power_law_1.01,0.13148159980773927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,32,power_law_1.01,0.14435839653015137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,32,power_law_1.2,0.11738879680633545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,32,power_law_1.2,0.12550400495529174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,4,balanced,0.1856106718381246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,4,balanced,0.18585066000620523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,4,power_law_1.01,0.18178559541702272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,4,power_law_1.01,0.1850816011428833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,4,power_law_1.2,0.1815616011619568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,4,power_law_1.2,0.18474240303039552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,8,balanced,0.1153706709543864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,8,balanced,0.11629866560300191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,8,power_law_1.01,0.11091840267181396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,8,power_law_1.01,0.11132160425186158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,8,power_law_1.2,0.10981760025024415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,1,8,power_law_1.2,0.11263359785079956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,2,1,balanced,0.3347253402074178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,2,1,balanced,0.33532265822092694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,2,1,power_law_1.01,0.34046719074249265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,2,1,power_law_1.01,0.345030403137207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,2,1,power_law_1.2,0.35891199111938477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,2,1,power_law_1.2,0.3622783899307251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,4,1,balanced,0.1963040033976237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,4,1,balanced,0.1967680056889852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,4,1,power_law_1.01,0.2112895965576172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,4,1,power_law_1.01,0.2118079900741577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,4,1,power_law_1.2,0.21358079910278321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,4,1,power_law_1.2,0.21504640579223633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,8,1,balanced,0.1241333285967509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,8,1,balanced,0.12517866492271423
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,8,1,power_law_1.01,0.13062399625778198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,8,1,power_law_1.01,0.13111679553985595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,8,1,power_law_1.2,0.13215999603271483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,6144,2560,8,160,8,1,power_law_1.2,0.13470079898834228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,1,balanced,0.9135839939117432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,1,balanced,0.9147146542867025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,1,power_law_1.01,0.785152006149292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,1,power_law_1.01,0.7854591846466065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,1,power_law_1.2,0.7974207878112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,1,power_law_1.2,0.8129983901977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,128,balanced,0.05590933561325073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,128,balanced,0.05620799958705902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,128,power_law_1.01,0.0517632007598877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,128,power_law_1.01,0.0526528000831604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,128,power_law_1.2,0.05243520140647888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,128,power_law_1.2,0.05374720096588135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,16,balanced,0.13623467087745667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,16,balanced,0.13700266679128012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,16,power_law_1.01,0.11356159448623657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,16,power_law_1.01,0.11893119812011718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,16,power_law_1.2,0.110099196434021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,16,power_law_1.2,0.11612800359725953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,2,balanced,0.47494399547576904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,2,balanced,0.4763466517130534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,2,power_law_1.01,0.4143360137939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,2,power_law_1.01,0.4257728099822998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,2,power_law_1.2,0.41896958351135255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,2,power_law_1.2,0.4336128234863281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,256,balanced,0.047968000173568726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,256,balanced,0.04798933366934458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,256,power_law_1.01,0.04449920058250427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,256,power_law_1.01,0.04568960070610047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,256,power_law_1.2,0.0447488009929657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,256,power_law_1.2,0.04550400078296661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,32,balanced,0.20517865816752115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,32,balanced,0.21172267198562622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,32,power_law_1.01,0.19128960371017456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,32,power_law_1.01,0.19274239540100097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,32,power_law_1.2,0.17605119943618774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,32,power_law_1.2,0.18405760526657106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,4,balanced,0.25916266441345215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,4,balanced,0.2594826618830363
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,4,power_law_1.01,0.22421119213104249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,4,power_law_1.01,0.23444480895996095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,4,power_law_1.2,0.22597119808197022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,4,power_law_1.2,0.2293760061264038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,64,balanced,0.11149332920710246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,64,balanced,0.11442666252454121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,64,power_law_1.01,0.09082880020141601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,64,power_law_1.01,0.10240639448165893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,64,power_law_1.2,0.07930240035057068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,64,power_law_1.2,0.09367679953575134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,8,balanced,0.15267733732859293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,8,balanced,0.15406399965286255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,8,power_law_1.01,0.13774720430374146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,8,power_law_1.01,0.13827199935913087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,8,power_law_1.2,0.1384703993797302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,1,8,power_law_1.2,0.1439743995666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,16,1,balanced,0.12851199507713318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,16,1,balanced,0.1290720005830129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,16,1,power_law_1.01,0.12621439695358277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,16,1,power_law_1.01,0.12769919633865356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,16,1,power_law_1.2,0.1260800004005432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,16,1,power_law_1.2,0.12738560438156127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,2,1,balanced,0.47791465123494464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,2,1,balanced,0.4786986509958903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,2,1,power_law_1.01,0.4141248226165771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,2,1,power_law_1.01,0.41955199241638186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,2,1,power_law_1.2,0.41841921806335447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,2,1,power_law_1.2,0.4200128078460693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,32,1,balanced,0.10711466272672017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,32,1,balanced,0.10919466614723206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,32,1,power_law_1.01,0.10826879739761353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,32,1,power_law_1.01,0.11078399419784546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,32,1,power_law_1.2,0.11063040494918823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,32,1,power_law_1.2,0.11179519891738891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,4,1,balanced,0.2661653359731038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,4,1,balanced,0.2680799961090088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,4,1,power_law_1.01,0.2360383987426758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,4,1,power_law_1.01,0.23950719833374023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,4,1,power_law_1.2,0.23804159164428712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,4,1,power_law_1.2,0.23868799209594727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,8,1,balanced,0.16851200660069784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,8,1,balanced,0.17005334297815958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,8,1,power_law_1.01,0.1578495979309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,8,1,power_law_1.01,0.1600383996963501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,8,1,power_law_1.2,0.15921920537948608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,256,8,1,power_law_1.2,0.16061439514160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,1,balanced,1.3419893582661946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,1,balanced,1.3427839279174805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,1,power_law_1.01,1.0299776077270508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,1,power_law_1.01,1.0321408271789552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,1,power_law_1.2,1.0196736335754395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,1,power_law_1.2,1.0318464279174804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,128,balanced,0.09598933657010396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,128,balanced,0.09684266646703084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,128,power_law_1.01,0.08791679739952088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,128,power_law_1.01,0.08997120261192322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,128,power_law_1.2,0.08618239760398864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,128,power_law_1.2,0.0884223997592926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,16,balanced,0.12797333796819052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,16,balanced,0.12876266241073608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,16,power_law_1.01,0.10341119766235352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,16,power_law_1.01,0.11149439811706544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,16,power_law_1.2,0.10673919916152955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,16,power_law_1.2,0.11521919965744018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,2,balanced,0.6890239715576172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,2,balanced,0.6902026335398356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,2,power_law_1.01,0.5623487949371337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,2,power_law_1.01,0.5736192226409912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,2,power_law_1.2,0.5525311946868896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,2,power_law_1.2,0.5778751850128174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,32,balanced,0.11497599879900615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,32,balanced,0.11675199866294861
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,32,power_law_1.01,0.09868159890174866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,32,power_law_1.01,0.10483200550079345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,32,power_law_1.2,0.09366400241851806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,32,power_law_1.2,0.09587200284004212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,4,balanced,0.36189866065979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,4,balanced,0.36190398534138996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,4,power_law_1.01,0.3077375888824463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,4,power_law_1.01,0.340883207321167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,4,power_law_1.2,0.2909503936767578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,4,power_law_1.2,0.2970304012298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,64,balanced,0.17516799767812094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,64,balanced,0.19337066014607748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,64,power_law_1.01,0.15676800012588502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,64,power_law_1.01,0.17067519426345826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,64,power_law_1.2,0.14265600442886353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,64,power_law_1.2,0.14380160570144654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,8,balanced,0.20533865690231323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,8,balanced,0.2067199945449829
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,8,power_law_1.01,0.16974719762802123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,8,power_law_1.01,0.1948799967765808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,8,power_law_1.2,0.16177279949188234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,1,8,power_law_1.2,0.16890239715576172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,16,1,balanced,0.16777066389719644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,16,1,balanced,0.16898133357365927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,16,1,power_law_1.01,0.1487552046775818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,16,1,power_law_1.01,0.1487936019897461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,16,1,power_law_1.2,0.1483839988708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,16,1,power_law_1.2,0.14918400049209596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,2,1,balanced,0.6919413407643636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,2,1,balanced,0.6928373177846273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,2,1,power_law_1.01,0.5402751922607422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,2,1,power_law_1.01,0.5492991924285888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,2,1,power_law_1.2,0.5287487983703614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,2,1,power_law_1.2,0.5334847927093506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,32,1,balanced,0.1402186652024587
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,32,1,balanced,0.14036267002423605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,32,1,power_law_1.01,0.12706559896469116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,32,1,power_law_1.01,0.12829439640045165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,32,1,power_law_1.2,0.12775039672851562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,32,1,power_law_1.2,0.13032959699630736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,4,1,balanced,0.373306671778361
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,4,1,balanced,0.3754986524581909
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,4,1,power_law_1.01,0.30079360008239747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,4,1,power_law_1.01,0.3012415885925293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,4,1,power_law_1.2,0.2977344036102295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,4,1,power_law_1.2,0.3007040023803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,8,1,balanced,0.2260800004005432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,8,1,balanced,0.2274186611175537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,8,1,power_law_1.01,0.1929471969604492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,8,1,power_law_1.01,0.19344639778137207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,8,1,power_law_1.2,0.19033600091934205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,160,7168,2048,8,384,8,1,power_law_1.2,0.19132159948348998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,1,balanced,0.8197279771169027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,1,balanced,0.8310186862945557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,1,power_law_1.01,0.9002240180969239
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,1,power_law_1.01,0.9027775764465332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,1,power_law_1.2,0.9203328132629395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,1,power_law_1.2,0.9324607849121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,128,balanced,0.19646932681401572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,128,balanced,0.19659199317296347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,128,power_law_1.01,0.23475840091705322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,128,power_law_1.01,0.23807361125946044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,128,power_law_1.2,0.26679680347442625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,128,power_law_1.2,0.2694080114364624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,16,balanced,0.23136534293492636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,16,balanced,0.23148800929387411
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,16,power_law_1.01,0.28083200454711915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,16,power_law_1.01,0.29249279499053954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,16,power_law_1.2,0.32503039836883546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,16,power_law_1.2,0.35164799690246584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,2,balanced,0.5022720098495483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,2,balanced,0.5022826592127482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,2,power_law_1.01,0.5750847816467285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,2,power_law_1.01,0.5904767990112305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,2,power_law_1.2,0.6267263889312744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,2,power_law_1.2,0.629260778427124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,32,balanced,0.20947200059890747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,32,balanced,0.2107093334197998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,32,power_law_1.01,0.26759679317474366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,32,power_law_1.01,0.2686912059783936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,32,power_law_1.2,0.29781761169433596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,32,power_law_1.2,0.3031487941741943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,4,balanced,0.34967998663584393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,4,balanced,0.3503146568934123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,4,power_law_1.01,0.42882561683654785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,4,power_law_1.01,0.43965439796447753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,4,power_law_1.2,0.4429056167602539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,4,power_law_1.2,0.4484288215637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,64,balanced,0.20097599426905313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,64,balanced,0.20115200678507486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,64,power_law_1.01,0.25073919296264646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,64,power_law_1.01,0.2541183948516846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,64,power_law_1.2,0.2808768033981323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,64,power_law_1.2,0.28219521045684814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,8,balanced,0.27213867505391437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,8,balanced,0.27238933245340985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,8,power_law_1.01,0.3269824028015137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,8,power_law_1.01,0.34206719398498536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,8,power_law_1.2,0.35691521167755125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,1,8,power_law_1.2,0.3732736110687256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,2,1,balanced,0.6055573225021362
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,2,1,balanced,0.6079253355662028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,2,1,power_law_1.01,0.6295487880706787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,2,1,power_law_1.01,0.6339776039123535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,2,1,power_law_1.2,0.6385151863098144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,2,1,power_law_1.2,0.6512767791748046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,4,1,balanced,0.5227466821670532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,4,1,balanced,0.5243786573410034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,4,1,power_law_1.01,0.5399040222167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,4,1,power_law_1.01,0.540172815322876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,4,1,power_law_1.2,0.5422592163085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,2048,768,8,128,4,1,power_law_1.2,0.5503039836883545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,1,balanced,1.5553065935770671
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,1,balanced,1.6056267420450847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,1,power_law_1.01,2.1660160064697265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,1,power_law_1.01,2.25296630859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,1,power_law_1.2,2.316716766357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,1,power_law_1.2,2.331283187866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,128,balanced,0.2726080020268758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,128,balanced,0.2730986674626668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,128,power_law_1.01,0.32047998905181885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,128,power_law_1.01,0.3209023952484131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,128,power_law_1.2,0.3606208086013794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,128,power_law_1.2,0.3772223949432373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,16,balanced,0.3408159812291463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,16,balanced,0.34084800879160565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,16,power_law_1.01,0.4840384006500244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,16,power_law_1.01,0.49013118743896483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,16,power_law_1.2,0.5127103805541993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,16,power_law_1.2,0.541484785079956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,2,balanced,0.8789172967274984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,2,balanced,0.8828480243682861
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,2,power_law_1.01,1.4447423934936523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,2,power_law_1.01,1.5474047660827637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,2,power_law_1.2,1.6173311233520509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,2,power_law_1.2,1.6271167755126954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,256,balanced,0.26921067635218304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,256,balanced,0.2698240081469218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,256,power_law_1.01,0.30385279655456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,256,power_law_1.01,0.3067712068557739
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,256,power_law_1.2,0.3581183910369873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,256,power_law_1.2,0.36538240909576414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,32,balanced,0.299834668636322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,32,balanced,0.3018346627553304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,32,power_law_1.01,0.3993535995483398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,32,power_law_1.01,0.4060031890869141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,32,power_law_1.2,0.4521279811859131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,32,power_law_1.2,0.47253761291503904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,4,balanced,0.5726026693979899
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,4,balanced,0.573861320813497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,4,power_law_1.01,0.9314816474914551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,4,power_law_1.01,0.9873344421386718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,4,power_law_1.2,1.0664192199707032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,4,power_law_1.2,1.0996800422668458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,64,balanced,0.28067199389139813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,64,balanced,0.2807893355687459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,64,power_law_1.01,0.34853758811950686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,64,power_law_1.01,0.3542527914047241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,64,power_law_1.2,0.39611520767211916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,64,power_law_1.2,0.40773758888244627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,8,balanced,0.4204639991124471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,8,balanced,0.4222986698150635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,8,power_law_1.01,0.6273344039916993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,8,power_law_1.01,0.668006420135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,8,power_law_1.2,0.6890751838684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,1,8,power_law_1.2,0.7295487880706787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,2,1,balanced,0.9852960109710693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,2,1,balanced,0.9882826805114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,2,1,power_law_1.01,1.337446403503418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,2,1,power_law_1.01,1.363916778564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,2,1,power_law_1.2,1.365670394897461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,2,1,power_law_1.2,1.3720767974853516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,4,1,balanced,0.74562668800354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,4,1,balanced,0.7476480007171631
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,4,1,power_law_1.01,0.9418560028076172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,4,1,power_law_1.01,0.9509183883666992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,4,1,power_law_1.2,0.9492351531982421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,4,1,power_law_1.2,0.9555135726928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,8,1,balanced,0.6616266568501791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,8,1,balanced,0.6633386611938477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,8,1,power_law_1.01,0.7788479804992676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,8,1,power_law_1.01,0.7861504077911377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,8,1,power_law_1.2,0.798144006729126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,3072,1536,8,256,8,1,power_law_1.2,0.8246591567993165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,1,balanced,3.3745333353678384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,1,balanced,3.5080747604370117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,1,power_law_1.01,3.3908863067626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,1,power_law_1.01,3.4933441162109373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,1,power_law_1.2,3.4978305816650392
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,1,power_law_1.2,3.5545406341552734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,2,balanced,1.7474986712137859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,2,balanced,1.7807572682698567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,2,power_law_1.01,2.143494415283203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,2,power_law_1.01,2.2623104095458983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,2,power_law_1.2,2.232415962219238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,2,power_law_1.2,2.661260795593262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,4,balanced,1.024506648381551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,4,balanced,1.025210698445638
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,4,power_law_1.01,1.7665023803710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,4,power_law_1.01,1.8631551742553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,4,power_law_1.2,1.8312448501586913
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,4,power_law_1.2,1.9345663070678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,8,balanced,0.6601386864980062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,8,balanced,0.6611359914143881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,8,power_law_1.01,1.56046724319458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,8,power_law_1.01,1.604217529296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,8,power_law_1.2,1.6479999542236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,1,8,power_law_1.2,1.7314624786376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,16,1,balanced,0.547765334447225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,16,1,balanced,0.5492480198542277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,16,1,power_law_1.01,0.546950387954712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,16,1,power_law_1.01,0.5500160217285156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,16,1,power_law_1.2,0.5518464088439942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,16,1,power_law_1.2,0.5521279811859131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,2,1,balanced,1.7650292714436848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,2,1,balanced,1.789749304453532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,2,1,power_law_1.01,1.8549055099487304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,2,1,power_law_1.01,1.9030975341796874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,2,1,power_law_1.2,1.8654912948608398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,2,1,power_law_1.2,1.866579246520996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,32,1,balanced,0.466106653213501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,32,1,balanced,0.4664693276087443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,32,1,power_law_1.01,0.4698239803314209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,32,1,power_law_1.01,0.46990718841552737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,32,1,power_law_1.2,0.46675839424133303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,32,1,power_law_1.2,0.4673471927642822
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,4,1,balanced,1.064677317937215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,4,1,balanced,1.0647413730621338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,4,1,power_law_1.01,1.109785556793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,4,1,power_law_1.01,1.121664047241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,4,1,power_law_1.2,1.0953984260559082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,4,1,power_law_1.2,1.124294376373291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,8,1,balanced,0.7138026555379232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,8,1,balanced,0.7179146607716879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,8,1,power_law_1.01,0.7267327785491944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,8,1,power_law_1.01,0.7292863845825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,8,1,power_law_1.2,0.7251520156860352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,14336,2,8,8,1,power_law_1.2,0.728268814086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,1,balanced,1.848042647043864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,1,balanced,1.8501760164896648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,1,power_law_1.01,2.2760383605957033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,1,power_law_1.01,2.289267158508301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,1,power_law_1.2,2.3472831726074217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,1,power_law_1.2,2.3745599746704102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,128,balanced,0.3359466791152954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,128,balanced,0.33694398403167725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,128,power_law_1.01,0.41455998420715334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,128,power_law_1.01,0.423199987411499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,128,power_law_1.2,0.4903615951538086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,128,power_law_1.2,0.4987775802612305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,16,balanced,0.41309332847595215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,16,balanced,0.4136799971262614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,16,power_law_1.01,0.5729983806610107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,16,power_law_1.01,0.5994048118591309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,16,power_law_1.2,0.6051136016845703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,16,power_law_1.2,0.6203711986541748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,2,balanced,1.038815975189209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,2,balanced,1.0437599817911785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,2,power_law_1.01,1.4224831581115722
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,2,power_law_1.01,1.4341312408447267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,2,power_law_1.2,1.5300607681274414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,2,power_law_1.2,1.577945613861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,32,balanced,0.3692320187886556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,32,balanced,0.36935468514760333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,32,power_law_1.01,0.4938176155090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,32,power_law_1.01,0.4994815826416016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,32,power_law_1.2,0.542310380935669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,32,power_law_1.2,0.5798272132873535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,4,balanced,0.6773333549499512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,4,balanced,0.6776959896087646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,4,power_law_1.01,0.9459456443786621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,4,power_law_1.01,1.009881591796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,4,power_law_1.2,1.08023681640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,4,power_law_1.2,1.0874176025390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,64,balanced,0.34537601470947266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,64,balanced,0.3463360071182251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,64,power_law_1.01,0.45749759674072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,64,power_law_1.01,0.45757441520690917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,64,power_law_1.2,0.5094143867492675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,64,power_law_1.2,0.5204351902008056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,8,balanced,0.5030879974365234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,8,balanced,0.5035946766535441
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,8,power_law_1.01,0.7220416069030762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,8,power_law_1.01,0.7385856151580811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,8,power_law_1.2,0.8010944366455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,1,8,power_law_1.2,0.823635196685791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,2,1,balanced,1.2072160243988037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,2,1,balanced,1.2193493048350017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,2,1,power_law_1.01,1.4026687622070313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,2,1,power_law_1.01,1.4167936325073243
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,2,1,power_law_1.2,1.4721471786499023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,2,1,power_law_1.2,1.4910016059875488
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,4,1,balanced,0.9382826487223307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,4,1,balanced,0.9405600229899088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,4,1,power_law_1.01,1.017311954498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,4,1,power_law_1.01,1.0333312034606934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,4,1,power_law_1.2,1.0404864311218263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,4,1,power_law_1.2,1.0741503715515137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,8,1,balanced,0.8372000058492025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,8,1,balanced,0.8413386344909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,8,1,power_law_1.01,0.8861120223999024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,8,1,power_law_1.01,0.8912447929382324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,8,1,power_law_1.2,0.9011072158813477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,4096,1536,8,128,8,1,power_law_1.2,0.9047295570373535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,1,balanced,6.856149037679036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,1,balanced,6.911482493082683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,1,power_law_1.01,7.231161499023438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,1,power_law_1.01,7.329862213134765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,1,power_law_1.2,6.9394371032714846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,1,power_law_1.2,7.210111999511719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,2,balanced,3.5753227869669595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,2,balanced,3.754730542500814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,2,power_law_1.01,4.814873504638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,2,power_law_1.01,4.909292984008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,2,power_law_1.2,5.115539169311523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,2,power_law_1.2,5.236095809936524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,4,balanced,1.8880853652954102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,4,balanced,1.9025279680887859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,4,power_law_1.01,3.520703887939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,4,power_law_1.01,3.936640167236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,4,power_law_1.2,3.5176063537597657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,4,power_law_1.2,3.65810546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,8,balanced,1.1058560212453206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,8,balanced,1.118127981821696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,8,power_law_1.01,3.1447872161865233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,8,power_law_1.01,3.4127105712890624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,8,power_law_1.2,3.4626880645751954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,1,8,power_law_1.2,3.490732955932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,16,1,balanced,0.787226676940918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,16,1,balanced,0.7889066537221273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,16,1,power_law_1.01,0.7936448097229004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,16,1,power_law_1.01,0.794700813293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,16,1,power_law_1.2,0.7941696166992187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,16,1,power_law_1.2,0.7949247837066651
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,2,1,balanced,3.0097440083821616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,2,1,balanced,3.0803839365641275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,2,1,power_law_1.01,2.93819522857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,2,1,power_law_1.01,2.9735679626464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,2,1,power_law_1.2,2.9989952087402343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,2,1,power_law_1.2,3.0259071350097657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,32,1,balanced,0.6537066698074341
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,32,1,balanced,0.6537653207778931
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,32,1,power_law_1.01,0.6563456058502197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,32,1,power_law_1.01,0.6579840183258057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,32,1,power_law_1.2,0.6582528114318847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,32,1,power_law_1.2,0.6593664169311524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,4,1,balanced,1.6644852956136067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,4,1,balanced,1.6713013648986816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,4,1,power_law_1.01,1.720217514038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,4,1,power_law_1.01,1.738924789428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,4,1,power_law_1.2,1.684659194946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,4,1,power_law_1.2,1.7177152633666992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,8,1,balanced,1.0851306915283203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,8,1,balanced,1.0862879753112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,8,1,power_law_1.01,1.1019519805908202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,8,1,power_law_1.01,1.106828784942627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,8,1,power_law_1.2,1.1042816162109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,16384,2,8,8,1,power_law_1.2,1.1094143867492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,1,balanced,3.7658507029215493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,1,balanced,3.7993812561035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,1,power_law_1.01,4.790252685546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,1,power_law_1.01,4.959603118896484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,1,power_law_1.2,5.145484924316406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,1,power_law_1.2,5.257113647460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,128,balanced,0.47597332795461017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,128,balanced,0.47628267606099445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,128,power_law_1.01,0.6030911922454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,128,power_law_1.01,0.6153151988983154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,128,power_law_1.2,0.6974527835845947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,128,power_law_1.2,0.7183743953704834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,16,balanced,0.6220586697260538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,16,balanced,0.6237920125325521
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,16,power_law_1.01,0.921388816833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,16,power_law_1.01,0.9653056144714356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,16,power_law_1.2,1.0635392189025878
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,16,power_law_1.2,1.1019007682800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,2,balanced,1.9033493995666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,2,balanced,1.912453333536784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,2,power_law_1.01,3.172064018249512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,2,power_law_1.01,3.254713439941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,2,power_law_1.2,3.4671615600585937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,2,power_law_1.2,3.486783981323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,256,balanced,0.46778666973114014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,256,balanced,0.46908799807230633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,256,power_law_1.01,0.5513023853302002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,256,power_law_1.01,0.5552576065063477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,256,power_law_1.2,0.6714752197265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,256,power_law_1.2,0.6776127815246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,32,balanced,0.5378453334172567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,32,balanced,0.5382506847381592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,32,power_law_1.01,0.7572415828704834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,32,power_law_1.01,0.7667391777038575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,32,power_law_1.2,0.8611968040466309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,32,power_law_1.2,0.8912575721740723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,4,balanced,1.148703972498576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,4,balanced,1.155461311340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,4,power_law_1.01,1.9664640426635742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,4,power_law_1.01,2.005459213256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,4,power_law_1.2,2.2704959869384767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,4,power_law_1.2,2.2975744247436523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,64,balanced,0.4968959887822469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,64,balanced,0.4979626735051473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,64,power_law_1.01,0.6312448024749756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,64,power_law_1.01,0.6540800094604492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,64,power_law_1.2,0.7525248050689697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,64,power_law_1.2,0.7602687835693359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,8,balanced,0.7947893142700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,8,balanced,0.7965760231018066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,8,power_law_1.01,1.3082752227783203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,8,power_law_1.01,1.3358464241027832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,8,power_law_1.2,1.442751979827881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,1,8,power_law_1.2,1.4868224143981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,16,1,balanced,1.0543306668599446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,16,1,balanced,1.055349349975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,16,1,power_law_1.01,1.1598464012145997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,16,1,power_law_1.01,1.1694272041320801
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,16,1,power_law_1.2,1.188697624206543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,16,1,power_law_1.2,1.202899169921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,2,1,balanced,2.0788532892862954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,2,1,balanced,2.1087466875712075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,2,1,power_law_1.01,2.7501440048217773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,2,1,power_law_1.01,2.801580810546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,2,1,power_law_1.2,2.9207040786743166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,2,1,power_law_1.2,2.9229055404663087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,32,1,balanced,1.0787519613901775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,32,1,balanced,1.0814773241678874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,32,1,power_law_1.01,1.1602432250976562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,32,1,power_law_1.01,1.1703807830810546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,32,1,power_law_1.2,1.1694144248962401
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,32,1,power_law_1.2,1.1916159629821776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,4,1,balanced,1.4590506553649902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,4,1,balanced,1.4670559565226238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,4,1,power_law_1.01,1.7657087326049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,4,1,power_law_1.01,1.8415487289428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,4,1,power_law_1.2,1.8822912216186523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,4,1,power_law_1.2,1.8995584487915038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,8,1,balanced,1.1718773047129314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,8,1,balanced,1.1733653545379639
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,8,1,power_law_1.01,1.339795207977295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,8,1,power_law_1.01,1.3558655738830567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,8,1,power_law_1.2,1.3803392410278321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2048,8,256,8,1,power_law_1.2,1.4028096199035645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,1,balanced,5.261509259541829
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,1,balanced,5.282453219095866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,1,power_law_1.01,5.1482688903808596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,1,power_law_1.01,5.157145690917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,1,power_law_1.2,5.363609695434571
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,1,power_law_1.2,5.5033729553222654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,16,balanced,0.7381920019785563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,16,balanced,0.7418506940205892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,16,power_law_1.01,1.0264063835144044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,16,power_law_1.01,1.0592448234558105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,16,power_law_1.2,1.1352831840515136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,16,power_law_1.2,1.3083840370178224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,2,balanced,2.67521603902181
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,2,balanced,2.745525360107422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,2,power_law_1.01,3.2202945709228517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,2,power_law_1.01,3.2350017547607424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,2,power_law_1.2,3.3719486236572265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,2,power_law_1.2,3.3965377807617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,32,balanced,0.6041119893391927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,32,balanced,0.606879989306132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,32,power_law_1.01,0.8100095748901367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,32,power_law_1.01,0.8157376289367676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,32,power_law_1.2,0.9286463737487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,32,power_law_1.2,1.0424192428588868
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,4,balanced,1.5519146919250488
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,4,balanced,1.5767466227213542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,4,power_law_1.01,1.991801643371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,4,power_law_1.01,2.013523292541504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,4,power_law_1.2,2.1607488632202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,4,power_law_1.2,2.205504035949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,8,balanced,1.0084319909413655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,8,balanced,1.0254933039347331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,8,power_law_1.01,1.293273639678955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,8,power_law_1.01,1.3376959800720214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,8,power_law_1.2,1.4458687782287598
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,1,8,power_law_1.2,1.5604096412658692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,2,1,balanced,2.9207468032836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,2,1,balanced,2.941221237182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,2,1,power_law_1.01,2.8820608139038084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,2,1,power_law_1.01,2.955257606506348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,2,1,power_law_1.2,2.952761650085449
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,2,1,power_law_1.2,2.9587711334228515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,4,1,balanced,1.8798027038574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,4,1,balanced,1.8968213399251301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,4,1,power_law_1.01,1.8918207168579102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,4,1,power_law_1.01,1.8999551773071288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,4,1,power_law_1.2,1.9077568054199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,4,1,power_law_1.2,1.9412607192993163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,8,1,balanced,1.5062452952067058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,8,1,balanced,1.5177653630574544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,8,1,power_law_1.01,1.4874048233032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,8,1,power_law_1.01,1.4934016227722169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,8,1,power_law_1.2,1.513753604888916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,6144,2560,8,160,8,1,power_law_1.2,1.5149567604064942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,1,balanced,3.990746815999349
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,1,balanced,4.329999923706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,1,power_law_1.01,5.507872009277344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,1,power_law_1.01,5.758694458007812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,1,power_law_1.2,5.815507125854492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,1,power_law_1.2,5.887571334838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,128,balanced,0.5452213287353516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,128,balanced,0.5463200012842814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,128,power_law_1.01,0.6876671791076661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,128,power_law_1.01,0.6904704093933105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,128,power_law_1.2,0.8196672439575196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,128,power_law_1.2,0.8334591865539551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,16,balanced,0.7162559827168783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,16,balanced,0.7181440194447836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,16,power_law_1.01,1.0476991653442382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,16,power_law_1.01,1.0650176048278808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,16,power_law_1.2,1.2348031997680664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,16,power_law_1.2,1.2614463806152343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,2,balanced,2.2315573692321777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,2,balanced,2.245024045308431
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,2,power_law_1.01,3.5220542907714845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,2,power_law_1.01,3.540415954589844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,2,power_law_1.2,3.7189441680908204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,2,power_law_1.2,3.802854537963867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,256,balanced,0.5362346569697062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,256,balanced,0.5372159878412882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,256,power_law_1.01,0.6353792190551758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,256,power_law_1.01,0.6371200084686279
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,256,power_law_1.2,0.7549056053161621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,256,power_law_1.2,0.767148780822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,32,balanced,0.6171893278757731
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,32,balanced,0.6195306777954102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,32,power_law_1.01,0.8498687744140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,32,power_law_1.01,0.8632448196411133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,32,power_law_1.2,0.9842432022094727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,32,power_law_1.2,1.024358367919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,4,balanced,1.3345173199971516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,4,balanced,1.3417760531107585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,4,power_law_1.01,2.191756820678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,4,power_law_1.01,2.256275177001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,4,power_law_1.2,2.4793279647827147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,4,power_law_1.2,2.529465675354004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,64,balanced,0.570090651512146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,64,balanced,0.570522665977478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,64,power_law_1.01,0.7437952041625977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,64,power_law_1.01,0.7686336040496826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,64,power_law_1.2,0.8194751739501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,64,power_law_1.2,0.8507007598876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,8,balanced,0.9170933564503988
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,8,balanced,0.9208799997965494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,8,power_law_1.01,1.4361663818359376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,8,power_law_1.01,1.4730048179626465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,8,power_law_1.2,1.5509696006774902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,1,8,power_law_1.2,1.7426111221313476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,16,1,balanced,1.2213493188222249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,16,1,balanced,1.221509297688802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,16,1,power_law_1.01,1.3122048377990723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,16,1,power_law_1.01,1.330291175842285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,16,1,power_law_1.2,1.3394047737121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,16,1,power_law_1.2,1.3455039978027343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,2,1,balanced,2.412837346394857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,2,1,balanced,2.5134080251057944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,2,1,power_law_1.01,3.153990364074707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,2,1,power_law_1.01,3.1976255416870116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,2,1,power_law_1.2,3.2977664947509764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,2,1,power_law_1.2,3.298553466796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,32,1,balanced,1.2478666305541992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,32,1,balanced,1.2506720225016277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,32,1,power_law_1.01,1.3291328430175782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,32,1,power_law_1.01,1.368819236755371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,32,1,power_law_1.2,1.3654975891113281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,32,1,power_law_1.2,1.3708352088928222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,4,1,balanced,1.6982720692952473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,4,1,balanced,1.7095252672831218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,4,1,power_law_1.01,2.020863914489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,4,1,power_law_1.01,2.072870445251465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,4,1,power_law_1.2,2.09356803894043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,4,1,power_law_1.2,2.1258623123168947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,8,1,balanced,1.362496058146159
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,8,1,balanced,1.3628959655761719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,8,1,power_law_1.01,1.524339199066162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,8,1,power_law_1.01,1.541267204284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,8,1,power_law_1.2,1.6058048248291015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,256,8,1,power_law_1.2,1.6341440200805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,1,balanced,6.039221445719401
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,1,balanced,6.160757064819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,1,power_law_1.01,6.253785705566406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,1,power_law_1.01,6.264646530151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,1,power_law_1.2,6.889478302001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,1,power_law_1.2,6.919904327392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,128,balanced,0.5544906854629517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,128,balanced,0.5583839813868204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,128,power_law_1.01,0.6679679870605468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,128,power_law_1.01,0.6762879848480224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,128,power_law_1.2,0.7518527984619141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,128,power_law_1.2,0.7594751834869384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,16,balanced,0.8086240291595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,16,balanced,0.8124213218688965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,16,power_law_1.01,1.0902463912963867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,16,power_law_1.01,1.116703987121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,16,power_law_1.2,1.2787903785705566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,16,power_law_1.2,1.2856703758239747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,2,balanced,2.974933306376139
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,2,balanced,3.039488156636556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,2,power_law_1.01,4.086643218994141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,2,power_law_1.01,4.101702499389648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,2,power_law_1.2,4.448921585083008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,2,power_law_1.2,4.576851272583008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,32,balanced,0.6669812997182211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,32,balanced,0.6674986680348715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,32,power_law_1.01,0.8824895858764649
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,32,power_law_1.01,0.8857088088989258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,32,power_law_1.2,0.9866047859191894
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,32,power_law_1.2,1.034118366241455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,4,balanced,1.5414560635884602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,4,balanced,1.6883734067281086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,4,power_law_1.01,2.497811126708984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,4,power_law_1.01,2.642201614379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,4,power_law_1.2,2.9198463439941404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,4,power_law_1.2,2.9753536224365233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,64,balanced,0.5946559906005859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,64,balanced,0.5993920167287191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,64,power_law_1.01,0.7357632160186768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,64,power_law_1.01,0.7486144065856933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,64,power_law_1.2,0.8159808158874512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,64,power_law_1.2,0.8629504203796386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,8,balanced,1.1041706403096516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,8,balanced,1.1077866554260254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,8,power_law_1.01,1.6171455383300781
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,8,power_law_1.01,1.6317056655883788
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,8,power_law_1.2,1.881395149230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,1,8,power_law_1.2,1.9322687149047852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,16,1,balanced,1.345311959584554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,16,1,balanced,1.346336046854655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,16,1,power_law_1.01,1.3865216255187989
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,16,1,power_law_1.01,1.396243190765381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,16,1,power_law_1.2,1.4228351593017579
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,16,1,power_law_1.2,1.4382847785949706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,2,1,balanced,3.09169069925944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,2,1,balanced,3.3974666595458984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,2,1,power_law_1.01,3.4332862854003907
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,2,1,power_law_1.01,3.500851058959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,2,1,power_law_1.2,3.750182342529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,2,1,power_law_1.2,3.8639041900634767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,32,1,balanced,1.3302133083343506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,32,1,balanced,1.3330026467641194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,32,1,power_law_1.01,1.392467212677002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,32,1,power_law_1.01,1.407583999633789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,32,1,power_law_1.2,1.4208255767822267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,32,1,power_law_1.2,1.4608768463134765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,4,1,balanced,2.040880044301351
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,4,1,balanced,2.0483147303263345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,4,1,power_law_1.01,2.223174476623535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,4,1,power_law_1.01,2.2966079711914062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,4,1,power_law_1.2,2.3612991333007813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,4,1,power_law_1.2,2.3752384185791016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,8,1,balanced,1.559168020884196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,8,1,balanced,1.5646613438924153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,8,1,power_law_1.01,1.6149824142456055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,8,1,power_law_1.01,1.6338367462158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,8,1,power_law_1.2,1.718886375427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,16384,7168,2048,8,384,8,1,power_law_1.2,1.72674560546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,1,balanced,0.09676266709963481
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,1,balanced,0.09707732995351155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,1,power_law_1.01,0.09467520117759705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,1,power_law_1.01,0.09531520009040832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,1,power_law_1.2,0.09472000002861022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,1,power_law_1.2,0.09542400240898133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,128,balanced,0.03739733248949051
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,128,balanced,0.038218667109807335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,128,power_law_1.01,0.0351936012506485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,128,power_law_1.01,0.0354559987783432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,128,power_law_1.2,0.03423359990119934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,128,power_law_1.2,0.035046398639678955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,16,balanced,0.05406933526198069
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,16,balanced,0.05411200225353241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,16,power_law_1.01,0.0474047988653183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,16,power_law_1.01,0.04807040095329285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,16,power_law_1.2,0.04639999866485596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,16,power_law_1.2,0.046598398685455324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,2,balanced,0.05880533158779144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,2,balanced,0.05971199770768484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,2,power_law_1.01,0.059513598680496216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,2,power_law_1.01,0.0604095995426178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,2,power_law_1.2,0.059673601388931276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,2,power_law_1.2,0.05973119735717773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,32,balanced,0.04563733438650767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,32,balanced,0.04584533472855886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,32,power_law_1.01,0.03986560106277466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,32,power_law_1.01,0.041119998693466185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,32,power_law_1.2,0.0387584000825882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,32,power_law_1.2,0.039059200882911684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,4,balanced,0.041482667128245033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,4,balanced,0.043935999274253845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,4,power_law_1.01,0.04260480105876922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,4,power_law_1.01,0.04434559941291809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,4,power_law_1.2,0.04407039880752563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,4,power_law_1.2,0.04575999975204468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,64,balanced,0.039818666875362396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,64,balanced,0.03990400085846583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,64,power_law_1.01,0.036160001158714296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,64,power_law_1.01,0.037190398573875426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,64,power_law_1.2,0.03523840010166168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,64,power_law_1.2,0.03548159897327423
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,8,balanced,0.045312002301216125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,8,balanced,0.045328001181284584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,8,power_law_1.01,0.03722879886627197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,8,power_law_1.01,0.037401598691940305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,8,power_law_1.2,0.0379584014415741
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,1,8,power_law_1.2,0.03861759901046753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,2,1,balanced,0.07021866738796234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,2,1,balanced,0.07043733199437459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,2,1,power_law_1.01,0.06641280055046081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,2,1,power_law_1.01,0.06763520240783691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,2,1,power_law_1.2,0.06638720035552978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,2,1,power_law_1.2,0.06811519861221313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,4,1,balanced,0.05445333321889242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,4,1,balanced,0.0565226674079895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,4,1,power_law_1.01,0.05295360088348389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,4,1,power_law_1.01,0.055430400371551516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,4,1,power_law_1.2,0.05497599840164184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,2048,768,8,128,4,1,power_law_1.2,0.055353599786758426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,1,balanced,0.3197919925053914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,1,balanced,0.3203999996185303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,1,power_law_1.01,0.2813503980636597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,1,power_law_1.01,0.28152320384979246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,1,power_law_1.2,0.28954238891601564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,1,power_law_1.2,0.2932415962219238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,128,balanced,0.039733332892258964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,128,balanced,0.04132800052563349
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,128,power_law_1.01,0.0384768009185791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,128,power_law_1.01,0.039103999733924866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,128,power_law_1.2,0.0379967987537384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,128,power_law_1.2,0.03863039910793305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,16,balanced,0.07331199944019318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,16,balanced,0.07357333103815715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,16,power_law_1.01,0.06222720146179199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,16,power_law_1.01,0.06307839751243591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,16,power_law_1.2,0.057868802547454835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,16,power_law_1.2,0.0654911994934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,2,balanced,0.17747199535369873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,2,balanced,0.17856534322102866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,2,power_law_1.01,0.1570304036140442
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,2,power_law_1.01,0.16110719442367555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,2,power_law_1.2,0.15831680297851564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,2,power_law_1.2,0.16353280544281007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,256,balanced,0.039850667119026184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,256,balanced,0.04050666590531667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,256,power_law_1.01,0.0378495991230011
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,256,power_law_1.01,0.03842560052871704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,256,power_law_1.2,0.03709439933300018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,256,power_law_1.2,0.03818239867687225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,32,balanced,0.08802133798599243
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,32,balanced,0.09270399808883667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,32,power_law_1.01,0.0768064022064209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,32,power_law_1.01,0.07835519909858704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,32,power_law_1.2,0.07760000228881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,32,power_law_1.2,0.08529919981956482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,4,balanced,0.1072160005569458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,4,balanced,0.10823466380437215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,4,power_law_1.01,0.09350399971008301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,4,power_law_1.01,0.09690880179405212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,4,power_law_1.2,0.09690880179405212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,4,power_law_1.2,0.09711359739303589
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,64,balanced,0.049925332268079124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,64,balanced,0.050053333242734276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,64,power_law_1.01,0.04678399860858917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,64,power_law_1.01,0.047635200619697574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,64,power_law_1.2,0.045491200685501096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,64,power_law_1.2,0.04635519981384277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,8,balanced,0.07336533566315968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,8,balanced,0.07374399900436401
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,8,power_law_1.01,0.06574079990386963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,8,power_law_1.01,0.06718080043792725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,8,power_law_1.2,0.0690496027469635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,1,8,power_law_1.2,0.06934400200843811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,2,1,balanced,0.18077866236368814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,2,1,balanced,0.1811573306719462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,2,1,power_law_1.01,0.16594560146331788
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,2,1,power_law_1.01,0.16976640224456788
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,2,1,power_law_1.2,0.16963839530944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,2,1,power_law_1.2,0.17044479846954347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,4,1,balanced,0.11551466584205627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,4,1,balanced,0.11675199866294861
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,4,1,power_law_1.01,0.10784640312194824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,4,1,power_law_1.01,0.10821759700775146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,4,1,power_law_1.2,0.1085312008857727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,4,1,power_law_1.2,0.10944000482559205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,8,1,balanced,0.08550399541854858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,8,1,balanced,0.08640000224113464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,8,1,power_law_1.01,0.08506879806518555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,8,1,power_law_1.01,0.0852288007736206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,8,1,power_law_1.2,0.08511360287666321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,3072,1536,8,256,8,1,power_law_1.2,0.08535040020942689
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,1,balanced,0.1964213252067566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,1,balanced,0.19710934162139893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,1,power_law_1.01,0.198636794090271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,1,power_law_1.01,0.2040895938873291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,1,power_law_1.2,0.20286719799041747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,1,power_law_1.2,0.20511360168457032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,2,balanced,0.10735999544461568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,2,balanced,0.1076853374640147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,2,power_law_1.01,0.12288000583648681
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,2,power_law_1.01,0.12899199724197388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,2,power_law_1.2,0.12081279754638671
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,2,power_law_1.2,0.13023359775543214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,4,balanced,0.20534932613372803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,4,balanced,0.20795732736587524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,4,power_law_1.01,0.11674239635467529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,4,power_law_1.01,0.16800639629364014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,4,power_law_1.2,0.09595519900321961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,4,power_law_1.2,0.12632960081100464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,8,balanced,0.1474399964014689
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,8,balanced,0.1482080022493998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,8,power_law_1.01,0.11336959600448608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,8,power_law_1.01,0.11905280351638795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,8,power_law_1.2,0.09134079813957215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,1,8,power_law_1.2,0.12302720546722412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,16,1,balanced,0.04151466737190882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,16,1,balanced,0.0418453315893809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,16,1,power_law_1.01,0.03991680145263672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,16,1,power_law_1.01,0.040780800580978396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,16,1,power_law_1.2,0.03975679874420166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,16,1,power_law_1.2,0.03989759981632233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,2,1,balanced,0.10898666580518086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,2,1,balanced,0.10986666878064473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,2,1,power_law_1.01,0.11553280353546143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,2,1,power_law_1.01,0.11731840372085571
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,2,1,power_law_1.2,0.11448320150375366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,2,1,power_law_1.2,0.11571199893951416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,32,1,balanced,0.035642666121323906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,32,1,balanced,0.03772799919048945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,32,1,power_law_1.01,0.03407999873161316
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,32,1,power_law_1.01,0.035020801424980166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,32,1,power_law_1.2,0.03441280126571655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,32,1,power_law_1.2,0.03522560000419617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,4,1,balanced,0.07297066847483318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,4,1,balanced,0.07508266468842824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,4,1,power_law_1.01,0.07339519858360291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,4,1,power_law_1.01,0.07373440265655518
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,4,1,power_law_1.2,0.07325440049171447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,4,1,power_law_1.2,0.07382400035858154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,8,1,balanced,0.0558186670144399
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,8,1,balanced,0.05605333546797434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,8,1,power_law_1.01,0.053574401140213015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,8,1,power_law_1.01,0.05421440005302429
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,8,1,power_law_1.2,0.054028797149658206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,14336,2,8,8,1,power_law_1.2,0.054092800617218016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,1,balanced,0.25919999678929645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,1,balanced,0.259770671526591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,1,power_law_1.01,0.26194560527801514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,1,power_law_1.01,0.2631808042526245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,1,power_law_1.2,0.2686527967453003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,1,power_law_1.2,0.26928000450134276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,128,balanced,0.041493333876132965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,128,balanced,0.04159466673930486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,128,power_law_1.01,0.03976320028305054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,128,power_law_1.01,0.04005120098590851
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,128,power_law_1.2,0.03978880047798157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,128,power_law_1.2,0.03997440040111542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,16,balanced,0.10737066467603047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,16,balanced,0.11347200473149617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,16,power_law_1.01,0.078438401222229
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,16,power_law_1.01,0.09537919759750366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,16,power_law_1.2,0.08543360233306885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,16,power_law_1.2,0.09028480052947999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,2,balanced,0.13596266508102417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,2,balanced,0.1360426644484202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,2,power_law_1.01,0.13341439962387086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,2,power_law_1.01,0.13490560054779052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,2,power_law_1.2,0.13839999437332154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,2,power_law_1.2,0.13987200260162352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,32,balanced,0.047877331574757896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,32,balanced,0.048010667165120445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,32,power_law_1.01,0.04444800019264221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,32,power_law_1.01,0.044761601090431216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,32,power_law_1.2,0.04351359903812409
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,32,power_law_1.2,0.04445439875125885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,4,balanced,0.0872320036093394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,4,balanced,0.08781866232554118
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,4,power_law_1.01,0.08510079979896545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,4,power_law_1.01,0.08572800159454345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,4,power_law_1.2,0.08723199963569642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,4,power_law_1.2,0.08759679794311523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,64,balanced,0.04224533339341482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,64,balanced,0.04362666606903076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,64,power_law_1.01,0.040243199467658995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,64,power_law_1.01,0.04059520065784454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,64,power_law_1.2,0.04012799859046936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,64,power_law_1.2,0.040601599216461184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,8,balanced,0.08051200211048126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,8,balanced,0.08064533273379008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,8,power_law_1.01,0.06307200193405152
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,8,power_law_1.01,0.07103360295295716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,8,power_law_1.2,0.06881279945373535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,1,8,power_law_1.2,0.06935679912567139
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,2,1,balanced,0.16351466377576193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,2,1,balanced,0.16510933637619019
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,2,1,power_law_1.01,0.1611199975013733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,2,1,power_law_1.01,0.1622912049293518
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,2,1,power_law_1.2,0.16198400259017945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,2,1,power_law_1.2,0.16325119733810425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,4,1,balanced,0.10528000195821126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,4,1,balanced,0.1055413285891215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,4,1,power_law_1.01,0.10278400182723998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,4,1,power_law_1.01,0.10302079916000366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,4,1,power_law_1.2,0.10410239696502685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,4,1,power_law_1.2,0.10426239967346192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,8,1,balanced,0.08267199993133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,8,1,balanced,0.08572266499201457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,8,1,power_law_1.01,0.08247039914131164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,8,1,power_law_1.01,0.08289920091629029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,8,1,power_law_1.2,0.08244479894638061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,4096,1536,8,128,8,1,power_law_1.2,0.08291199803352356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,1,balanced,0.38515734672546387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,1,balanced,0.38651732603708905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,1,power_law_1.01,0.3705280065536499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,1,power_law_1.01,0.3797375917434692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,1,power_law_1.2,0.3817728042602539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,1,power_law_1.2,0.3862272024154663
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,2,balanced,0.15843733151753744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,2,balanced,0.15848533312479654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,2,power_law_1.01,0.1982143998146057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,2,power_law_1.01,0.20639359951019287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,2,power_law_1.2,0.19427839517593384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,2,power_law_1.2,0.19685759544372558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,4,balanced,0.2675146659215291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,4,balanced,0.27331199248631793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,4,power_law_1.01,0.16920959949493408
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,4,power_law_1.01,0.1725759983062744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,4,power_law_1.2,0.16996480226516725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,4,power_law_1.2,0.1896448016166687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,8,balanced,0.16526933511098227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,8,balanced,0.16874132553736368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,8,power_law_1.01,0.155731201171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,8,power_law_1.01,0.15940480232238768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,8,power_law_1.2,0.15758719444274902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,1,8,power_law_1.2,0.16172800064086915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,16,1,balanced,0.052613332867622375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,16,1,balanced,0.0539626677831014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,16,1,power_law_1.01,0.05137280225753784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,16,1,power_law_1.01,0.051641601324081424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,16,1,power_law_1.2,0.05101439952850342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,16,1,power_law_1.2,0.05103999972343445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,2,1,balanced,0.1605226695537567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,2,1,balanced,0.16089066863059998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,2,1,power_law_1.01,0.17141120433807372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,2,1,power_law_1.01,0.1743872046470642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,2,1,power_law_1.2,0.17147519588470458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,2,1,power_law_1.2,0.17369600534439086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,32,1,balanced,0.04005866746107737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,32,1,balanced,0.04090133309364319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,32,1,power_law_1.01,0.0374208003282547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,32,1,power_law_1.01,0.03875199854373932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,32,1,power_law_1.2,0.038624000549316403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,32,1,power_law_1.2,0.03919360041618347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,4,1,balanced,0.09967466195424397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,4,1,balanced,0.09993066390355428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,4,1,power_law_1.01,0.10370559692382812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,4,1,power_law_1.01,0.10576000213623046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,4,1,power_law_1.2,0.10317440032958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,4,1,power_law_1.2,0.10512640476226806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,8,1,balanced,0.06832533578077953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,8,1,balanced,0.06919999917348225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,8,1,power_law_1.01,0.06854400038719177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,8,1,power_law_1.01,0.0694208025932312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,8,1,power_law_1.2,0.06852480173110961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,16384,2,8,8,1,power_law_1.2,0.0689408004283905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,1,balanced,0.7886346975962321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,1,balanced,0.7895840009053549
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,1,power_law_1.01,0.7106751918792724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,1,power_law_1.01,0.7151167869567872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,1,power_law_1.2,0.7112512111663818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,1,power_law_1.2,0.7324672222137452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,128,balanced,0.050944000482559204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,128,balanced,0.058186665177345276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,128,power_law_1.01,0.050316798686981204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,128,power_law_1.01,0.05052800178527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,128,power_law_1.2,0.049958398938179015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,128,power_law_1.2,0.05507199764251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,16,balanced,0.1253600021203359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,16,balanced,0.12613866726557413
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,16,power_law_1.01,0.10360959768295289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,16,power_law_1.01,0.10381439924240113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,16,power_law_1.2,0.09343360066413879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,16,power_law_1.2,0.09721599817276001
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,2,balanced,0.4115786552429199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,2,balanced,0.41265066464742023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,2,power_law_1.01,0.3723200082778931
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,2,power_law_1.01,0.37701759338378904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,2,power_law_1.2,0.3802560091018677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,2,power_law_1.2,0.39232640266418456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,256,balanced,0.04588800172011057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,256,balanced,0.04729066789150238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,256,power_law_1.01,0.04407680034637451
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,256,power_law_1.01,0.046649599075317384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,256,power_law_1.2,0.043750399351119997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,256,power_law_1.2,0.04387840032577515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,32,balanced,0.18581867218017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,32,balanced,0.19516799847284952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,32,power_law_1.01,0.16009600162506105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,32,power_law_1.01,0.17957119941711425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,32,power_law_1.2,0.1564095973968506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,32,power_law_1.2,0.15648000240325927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,4,balanced,0.22761066754659018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,4,balanced,0.22777066628138223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,4,power_law_1.01,0.1966976046562195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,4,power_law_1.01,0.20908799171447753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,4,power_law_1.2,0.20531840324401857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,4,power_law_1.2,0.21288321018218995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,64,balanced,0.0865119993686676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,64,balanced,0.08995733658472697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,64,power_law_1.01,0.07622399926185608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,64,power_law_1.01,0.07788159847259521
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,64,power_law_1.2,0.07204480171203613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,64,power_law_1.2,0.07511039972305297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,8,balanced,0.1378506620724996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,8,balanced,0.1379039982954661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,8,power_law_1.01,0.12195839881896972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,8,power_law_1.01,0.12490880489349365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,8,power_law_1.2,0.12314239740371705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,1,8,power_law_1.2,0.13031680583953859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,16,1,balanced,0.11566399534543355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,16,1,balanced,0.11568533380826314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,16,1,power_law_1.01,0.11823359727859498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,16,1,power_law_1.01,0.11844480037689209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,16,1,power_law_1.2,0.1189695954322815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,16,1,power_law_1.2,0.12060799598693847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,2,1,balanced,0.41656001408894855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,2,1,balanced,0.4168533484141032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,2,1,power_law_1.01,0.3663487911224365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,2,1,power_law_1.01,0.37411839962005616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,2,1,power_law_1.2,0.37896320819854734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,2,1,power_law_1.2,0.3793600082397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,32,1,balanced,0.09847467144330342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,32,1,balanced,0.09894399841626485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,32,1,power_law_1.01,0.10522240400314331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,32,1,power_law_1.01,0.10526080131530761
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,32,1,power_law_1.2,0.10551040172576905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,32,1,power_law_1.2,0.10610560178756714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,4,1,balanced,0.23537067572275797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,4,1,balanced,0.2353973388671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,4,1,power_law_1.01,0.21507198810577394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,4,1,power_law_1.01,0.21831679344177246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,4,1,power_law_1.2,0.21422719955444336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,4,1,power_law_1.2,0.21767039299011232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,8,1,balanced,0.15033066272735596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,8,1,balanced,0.15038399895032248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,8,1,power_law_1.01,0.14590079784393312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,8,1,power_law_1.01,0.14602880477905272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,8,1,power_law_1.2,0.1480512022972107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2048,8,256,8,1,power_law_1.2,0.14914560317993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,1,balanced,0.7132213115692139
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,1,balanced,0.7149759928385416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,1,power_law_1.01,0.6745984077453613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,1,power_law_1.01,0.6774655818939209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,1,power_law_1.2,0.7024960041046142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,1,power_law_1.2,0.7056831836700439
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,16,balanced,0.24984000126520792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,16,balanced,0.25165865818659466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,16,power_law_1.01,0.20396800041198732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,16,power_law_1.01,0.20888960361480713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,16,power_law_1.2,0.19216639995574952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,16,power_law_1.2,0.20730879306793212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,2,balanced,0.3365066846211751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,2,balanced,0.33712534109751385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,2,power_law_1.01,0.3244607925415039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,2,power_law_1.01,0.3245503902435303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,2,power_law_1.2,0.3373055934906006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,2,power_law_1.2,0.33882238864898684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,32,balanced,0.1527839998404185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,32,balanced,0.15482133626937866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,32,power_law_1.01,0.12425600290298462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,32,power_law_1.01,0.13070080280303956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,32,power_law_1.2,0.11284480094909669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,32,power_law_1.2,0.11689599752426147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,4,balanced,0.18918933471043906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,4,balanced,0.1895786722501119
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,4,power_law_1.01,0.1814144015312195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,4,power_law_1.01,0.18562560081481932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,4,power_law_1.2,0.1767359972000122
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,4,power_law_1.2,0.1878399968147278
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,8,balanced,0.16503467162450156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,8,balanced,0.17590399583180746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,8,power_law_1.01,0.14032000303268433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,8,power_law_1.01,0.1453760027885437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,8,power_law_1.2,0.12554880380630493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,1,8,power_law_1.2,0.12938239574432372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,2,1,balanced,0.39371200402577716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,2,1,balanced,0.3943893512090047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,2,1,power_law_1.01,0.35720961093902587
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,2,1,power_law_1.01,0.37114880084991453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,2,1,power_law_1.2,0.37432959079742434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,2,1,power_law_1.2,0.3793600082397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,4,1,balanced,0.2505439917246501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,4,1,balanced,0.25092266003290814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,4,1,power_law_1.01,0.2256319999694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,4,1,power_law_1.01,0.22565760612487792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,4,1,power_law_1.2,0.2286144018173218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,4,1,power_law_1.2,0.22941439151763915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,8,1,balanced,0.15289599696795145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,8,1,balanced,0.1530400017897288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,8,1,power_law_1.01,0.1384511947631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,8,1,power_law_1.01,0.13933440446853637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,8,1,power_law_1.2,0.14137599468231202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,6144,2560,8,160,8,1,power_law_1.2,0.142086398601532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,1,balanced,0.9150346914927164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,1,balanced,0.9159946441650391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,1,power_law_1.01,0.816160011291504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,1,power_law_1.01,0.8165311813354492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,1,power_law_1.2,0.8339008331298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,1,power_law_1.2,0.8518464088439941
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,128,balanced,0.05798399945100149
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,128,balanced,0.06039999922116598
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,128,power_law_1.01,0.05616639852523804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,128,power_law_1.01,0.057222402095794676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,128,power_law_1.2,0.05440639853477478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,128,power_law_1.2,0.05548160076141358
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,16,balanced,0.13261333107948303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,16,balanced,0.13539200027783713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,16,power_law_1.01,0.10807039737701415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,16,power_law_1.01,0.11490559577941895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,16,power_law_1.2,0.10578559637069702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,16,power_law_1.2,0.10713599920272827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,2,balanced,0.4774186611175537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,2,balanced,0.4788000186284383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,2,power_law_1.01,0.42894721031188965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,2,power_law_1.01,0.4323584079742432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,2,power_law_1.2,0.45267839431762696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,2,power_law_1.2,0.46517119407653806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,256,balanced,0.050010666251182556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,256,balanced,0.052154665191968284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,256,power_law_1.01,0.046803200244903566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,256,power_law_1.01,0.04772480130195618
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,256,power_law_1.2,0.04708479940891266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,256,power_law_1.2,0.04738560020923614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,32,balanced,0.2107200026512146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,32,balanced,0.22130666176478067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,32,power_law_1.01,0.18186880350112916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,32,power_law_1.01,0.20147840976715087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,32,power_law_1.2,0.17900160551071168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,32,power_law_1.2,0.1878399968147278
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,4,balanced,0.26206932465235394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,4,balanced,0.26427199443181354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,4,power_law_1.01,0.23376638889312745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,4,power_law_1.01,0.23720960617065429
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,4,power_law_1.2,0.23994879722595214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,4,power_law_1.2,0.24490880966186523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,64,balanced,0.09877866506576538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,64,balanced,0.10285333792368571
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,64,power_law_1.01,0.08488320112228394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,64,power_law_1.01,0.089055997133255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,64,power_law_1.2,0.08575999736785889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,64,power_law_1.2,0.08589439988136291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,8,balanced,0.156549334526062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,8,balanced,0.1565600037574768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,8,power_law_1.01,0.1375040054321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,8,power_law_1.01,0.14604159593582153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,8,power_law_1.2,0.1404736042022705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,1,8,power_law_1.2,0.14710400104522706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,16,1,balanced,0.13327466448148093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,16,1,balanced,0.13474133610725403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,16,1,power_law_1.01,0.13530880212783813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,16,1,power_law_1.01,0.13653119802474975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,16,1,power_law_1.2,0.13745280504226684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,16,1,power_law_1.2,0.1383296012878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,2,1,balanced,0.4829920132954915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,2,1,balanced,0.4843999942143758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,2,1,power_law_1.01,0.43067522048950196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,2,1,power_law_1.01,0.4345600128173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,2,1,power_law_1.2,0.4320703983306885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,2,1,power_law_1.2,0.43281922340393064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,32,1,balanced,0.11314133803049724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,32,1,balanced,0.1132533351580302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,32,1,power_law_1.01,0.11973119974136352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,32,1,power_law_1.01,0.11981439590454102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,32,1,power_law_1.2,0.12071039676666259
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,32,1,power_law_1.2,0.12106239795684814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,4,1,balanced,0.27246934175491333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,4,1,balanced,0.2733599940935771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,4,1,power_law_1.01,0.25012478828430174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,4,1,power_law_1.01,0.2506432056427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,4,1,power_law_1.2,0.2514624118804932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,4,1,power_law_1.2,0.25276799201965333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,8,1,balanced,0.17194666465123495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,8,1,balanced,0.17550933361053467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,8,1,power_law_1.01,0.1679744005203247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,8,1,power_law_1.01,0.1687999963760376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,8,1,power_law_1.2,0.16921600103378295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,256,8,1,power_law_1.2,0.17020800113677978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,1,balanced,1.3447893460591633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,1,balanced,1.3454933166503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,1,power_law_1.01,1.076352024078369
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,1,power_law_1.01,1.0765376091003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,1,power_law_1.2,1.076518440246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,1,power_law_1.2,1.0898303985595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,128,balanced,0.08283733328183492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,128,balanced,0.08461333314577739
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,128,power_law_1.01,0.07723519802093506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,128,power_law_1.01,0.07803519964218139
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,128,power_law_1.2,0.07062399983406067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,128,power_law_1.2,0.07720959782600403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,16,balanced,0.13169599572817484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,16,balanced,0.13171199957529703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,16,power_law_1.01,0.11128319501876831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,16,power_law_1.01,0.11640959978103638
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,16,power_law_1.2,0.11113599538803101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,16,power_law_1.2,0.12050559520721435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,2,balanced,0.6917706330617269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,2,balanced,0.6919786930084229
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,2,power_law_1.01,0.5622975826263428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,2,power_law_1.01,0.5769216060638428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,2,power_law_1.2,0.5492288112640381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,2,power_law_1.2,0.5682688236236573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,32,balanced,0.11534399787584941
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,32,balanced,0.11858133474985759
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,32,power_law_1.01,0.09051520228385926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,32,power_law_1.01,0.09715200066566468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,32,power_law_1.2,0.0902079999446869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,32,power_law_1.2,0.10030080080032348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,4,balanced,0.36606399218241376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,4,balanced,0.36666667461395264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,4,power_law_1.01,0.31173760890960694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,4,power_law_1.01,0.31372799873352053
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,4,power_law_1.2,0.30458879470825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,4,power_law_1.2,0.32025599479675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,64,balanced,0.16743467251459757
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,64,balanced,0.1732906699180603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,64,power_law_1.01,0.14704639911651612
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,64,power_law_1.01,0.16069120168685913
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,64,power_law_1.2,0.14566400051116943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,64,power_law_1.2,0.14687360525131227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,8,balanced,0.20677866538365683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,8,balanced,0.20865599314371744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,8,power_law_1.01,0.16807680130004882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,8,power_law_1.01,0.1748095989227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,8,power_law_1.2,0.17932159900665284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,1,8,power_law_1.2,0.1811519980430603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,16,1,balanced,0.17345066865285239
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,16,1,balanced,0.17491199572881064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,16,1,power_law_1.01,0.16110080480575562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,16,1,power_law_1.01,0.161190402507782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,16,1,power_law_1.2,0.16094720363616943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,16,1,power_law_1.2,0.161190402507782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,2,1,balanced,0.69706130027771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,2,1,balanced,0.6973546346028646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,2,1,power_law_1.01,0.5562367916107178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,2,1,power_law_1.01,0.566323184967041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,2,1,power_law_1.2,0.5535999774932862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,2,1,power_law_1.2,0.5567359924316406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,32,1,balanced,0.14380799730618796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,32,1,balanced,0.1448746621608734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,32,1,power_law_1.01,0.1370303988456726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,32,1,power_law_1.01,0.13791999816894532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,32,1,power_law_1.2,0.13605120182037353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,32,1,power_law_1.2,0.13757439851760864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,4,1,balanced,0.3798240025838216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,4,1,balanced,0.38011733690897626
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,4,1,power_law_1.01,0.3084223985671997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,4,1,power_law_1.01,0.31191680431365965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,4,1,power_law_1.2,0.31090559959411623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,4,1,power_law_1.2,0.31731839179992677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,8,1,balanced,0.23061333100001016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,8,1,balanced,0.23173866669336954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,8,1,power_law_1.01,0.20324480533599854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,8,1,power_law_1.01,0.2054975986480713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,8,1,power_law_1.2,0.20465281009674072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,192,7168,2048,8,384,8,1,power_law_1.2,0.2046976089477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,1,balanced,0.029370665550231934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,1,balanced,0.02938666691382726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,1,power_law_1.01,0.0289792001247406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,1,power_law_1.01,0.029734399914741517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,1,power_law_1.2,0.028255999088287354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,1,power_law_1.2,0.028940799832344054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,128,balanced,0.023370665808518726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,128,balanced,0.025231999655564625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,128,power_law_1.01,0.02176000028848648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,128,power_law_1.01,0.023206399381160737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,128,power_law_1.2,0.021593600511550903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,128,power_law_1.2,0.021881599724292756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,16,balanced,0.0230880007147789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,16,balanced,0.02310933421055476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,16,power_law_1.01,0.02333440035581589
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,16,power_law_1.01,0.023520000278949738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,16,power_law_1.2,0.022809599339962006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,16,power_law_1.2,0.023219199478626253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,2,balanced,0.02731200059254964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,2,balanced,0.02749866743882497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,2,power_law_1.01,0.02653439939022064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,2,power_law_1.01,0.028172799944877626
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,2,power_law_1.2,0.027027198672294618
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,2,power_law_1.2,0.027404800057411194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,32,balanced,0.023402666052182514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,32,balanced,0.025263999899228413
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,32,power_law_1.01,0.02325119972229004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,32,power_law_1.01,0.023558400571346283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,32,power_law_1.2,0.02136320024728775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,32,power_law_1.2,0.022457599639892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,4,balanced,0.025493333737055462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,4,balanced,0.026026666164398193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,4,power_law_1.01,0.026470398902893065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,4,power_law_1.01,0.027692800760269164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,4,power_law_1.2,0.024639999866485594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,4,power_law_1.2,0.025446400046348572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,64,balanced,0.023311999936898548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,64,balanced,0.025146665672461193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,64,power_law_1.01,0.022015999257564544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,64,power_law_1.01,0.02378239929676056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,64,power_law_1.2,0.021823999285697938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,64,power_law_1.2,0.021875199675559998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,8,balanced,0.025445332129796345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,8,balanced,0.025487999121348064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,8,power_law_1.01,0.02540160119533539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,8,power_law_1.01,0.025964799523353576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,8,power_law_1.2,0.026208001375198364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,1,8,power_law_1.2,0.02691200077533722
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,2,1,balanced,0.025775998830795288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,2,1,balanced,0.02714666724205017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,2,1,power_law_1.01,0.025388801097869874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,2,1,power_law_1.01,0.026105600595474242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,2,1,power_law_1.2,0.024422399699687958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,2,1,power_law_1.2,0.024959999322891235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,4,1,balanced,0.025216000775496166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,4,1,balanced,0.025279998779296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,4,1,power_law_1.01,0.023507200181484222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,4,1,power_law_1.01,0.023999999463558196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,4,1,power_law_1.2,0.023737600445747374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,2048,768,8,128,4,1,power_law_1.2,0.024160000681877136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,1,balanced,0.044810667634010315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,1,balanced,0.0454720010360082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,1,power_law_1.01,0.045747199654579164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,1,power_law_1.01,0.04695680141448975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,1,power_law_1.2,0.04526079893112182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,1,power_law_1.2,0.04708479940891266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,128,balanced,0.02496533344189326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,128,balanced,0.025114665428797405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,128,power_law_1.01,0.02328319996595383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,128,power_law_1.01,0.023423999547958374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,128,power_law_1.2,0.022995199263095855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,128,power_law_1.2,0.02322559952735901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,16,balanced,0.025439999997615814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,16,balanced,0.025514667232831318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,16,power_law_1.01,0.04609920084476471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,16,power_law_1.01,0.04663679897785187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,16,power_law_1.2,0.0452672004699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,16,power_law_1.2,0.046054399013519286
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,2,balanced,0.029333333174387615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,2,balanced,0.03123733401298523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,2,power_law_1.01,0.04550400078296661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,2,power_law_1.01,0.04565120041370392
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,2,power_law_1.2,0.04520959854125976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,2,power_law_1.2,0.045817598700523376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,256,balanced,0.025455998877684276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,256,balanced,0.027280000348885853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,256,power_law_1.01,0.022950400412082673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,256,power_law_1.01,0.0237184002995491
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,256,power_law_1.2,0.022655999660491942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,256,power_law_1.2,0.023193599283695222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,32,balanced,0.02588266630967458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,32,balanced,0.027482666075229645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,32,power_law_1.01,0.027897599339485168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,32,power_law_1.01,0.0302592009305954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,32,power_law_1.2,0.028774398565292358
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,32,power_law_1.2,0.028832000494003297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,4,balanced,0.02716800073782603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,4,balanced,0.02735466758410136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,4,power_law_1.01,0.04620159864425659
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,4,power_law_1.01,0.04629760086536407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,4,power_law_1.2,0.04580479860305786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,4,power_law_1.2,0.045977601408958436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,64,balanced,0.024442667762438457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,64,balanced,0.02513066679239273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,64,power_law_1.01,0.02409600019454956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,64,power_law_1.01,0.025939199328422546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,64,power_law_1.2,0.02467840015888214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,64,power_law_1.2,0.02475520074367523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,8,balanced,0.026464000344276428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,8,balanced,0.027535999814669292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,8,power_law_1.01,0.046028798818588255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,8,power_law_1.01,0.04669440090656281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,8,power_law_1.2,0.044633600115776065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,1,8,power_law_1.2,0.04531840085983276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,2,1,balanced,0.03054400036732356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,2,1,balanced,0.03229333211978277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,2,1,power_law_1.01,0.028646400570869444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,2,1,power_law_1.01,0.030924800038337707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,2,1,power_law_1.2,0.029734399914741517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,2,1,power_law_1.2,0.03043839931488037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,4,1,balanced,0.0273333340883255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,4,1,balanced,0.027429332335789997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,4,1,power_law_1.01,0.025964799523353576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,4,1,power_law_1.01,0.025971201062202454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,4,1,power_law_1.2,0.025939199328422546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,4,1,power_law_1.2,0.027609598636627198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,8,1,balanced,0.026949333647886913
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,8,1,balanced,0.027258666853109997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,8,1,power_law_1.01,0.024639999866485594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,8,1,power_law_1.01,0.025920000672340394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,8,1,power_law_1.2,0.024825599789619446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,3072,1536,8,256,8,1,power_law_1.2,0.026259198784828186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,1,balanced,0.08588266372680664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,1,balanced,0.0860053300857544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,1,power_law_1.01,0.07207040190696716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,1,power_law_1.01,0.07390720248222352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,1,power_law_1.2,0.07034879922866821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,1,power_law_1.2,0.07491199970245362
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,2,balanced,0.05816533168156942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,2,balanced,0.06029333174228668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,2,power_law_1.01,0.05395200252532959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,2,power_law_1.01,0.06287360191345215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,2,power_law_1.2,0.06113280057907104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,2,power_law_1.2,0.06446080207824707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,4,balanced,0.03957866628964742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,4,balanced,0.039642666776975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,4,power_law_1.01,0.05175679922103882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,4,power_law_1.01,0.052857601642608644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,4,power_law_1.2,0.04764159917831421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,4,power_law_1.2,0.051648002862930295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,8,balanced,0.04251199960708618
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,8,balanced,0.04370133578777313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,8,power_law_1.01,0.03975679874420166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,8,power_law_1.01,0.04234879910945892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,8,power_law_1.2,0.03927040100097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,1,8,power_law_1.2,0.04281600117683411
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,16,1,balanced,0.02735999971628189
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,16,1,balanced,0.02749866743882497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,16,1,power_law_1.01,0.02412160038948059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,16,1,power_law_1.01,0.026348799467086792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,16,1,power_law_1.2,0.024742400646209715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,16,1,power_law_1.2,0.02492160052061081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,2,1,balanced,0.05682133138179779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,2,1,balanced,0.05750399827957153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,2,1,power_law_1.01,0.04583039879798889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,2,1,power_law_1.01,0.052243202924728394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,2,1,power_law_1.2,0.049439999461174014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,2,1,power_law_1.2,0.0511680006980896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,32,1,balanced,0.025392000873883564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,32,1,balanced,0.0271573339899381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,32,1,power_law_1.01,0.02423039972782135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,32,1,power_law_1.01,0.025785601139068602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,32,1,power_law_1.2,0.02420479953289032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,32,1,power_law_1.2,0.025817599892616273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,4,1,balanced,0.03760000069936117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,4,1,balanced,0.03823466598987579
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,4,1,power_law_1.01,0.031673601269721983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,4,1,power_law_1.01,0.03560320138931274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,4,1,power_law_1.2,0.03480960130691528
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,4,1,power_law_1.2,0.035724800825119016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,8,1,balanced,0.027349332968393963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,8,1,balanced,0.02735466758410136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,8,1,power_law_1.01,0.02648319900035858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,8,1,power_law_1.01,0.027449598908424376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,8,1,power_law_1.2,0.026752001047134398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,14336,2,8,8,1,power_law_1.2,0.027193599939346315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,1,balanced,0.05328000088532766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,1,balanced,0.054042667150497437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,1,power_law_1.01,0.051712000370025636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,1,power_law_1.01,0.05219200253486633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,1,power_law_1.2,0.05246719717979431
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,1,power_law_1.2,0.05260800123214722
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,128,balanced,0.02548266698916753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,128,balanced,0.02722666660944621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,128,power_law_1.01,0.02540160119533539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,128,power_law_1.01,0.025593599677085875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,128,power_law_1.2,0.024294400215148927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,128,power_law_1.2,0.025696000456809996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,16,balanced,0.025861332813898723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,16,balanced,0.026346666117509205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,16,power_law_1.01,0.031206399202346802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,16,power_law_1.01,0.031737598776817325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,16,power_law_1.2,0.03149439990520477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,16,power_law_1.2,0.03155199885368347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,2,balanced,0.03141866624355316
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,2,balanced,0.0354666660229365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,2,power_law_1.01,0.04535039961338043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,2,power_law_1.01,0.04814079999923706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,2,power_law_1.2,0.04451839923858643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,2,power_law_1.2,0.04556800127029419
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,32,balanced,0.025199999411900837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,32,balanced,0.025285333395004272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,32,power_law_1.01,0.025740799307823182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,32,power_law_1.01,0.025939199328422546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,32,power_law_1.2,0.025536000728607178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,32,power_law_1.2,0.025727999210357667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,4,balanced,0.027957332630952198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,4,balanced,0.02940266579389572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,4,power_law_1.01,0.03891839981079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,4,power_law_1.01,0.04317440092563629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,4,power_law_1.2,0.039443200826644896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,4,power_law_1.2,0.04227199852466583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,64,balanced,0.02532800038655599
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,64,balanced,0.027210667729377747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,64,power_law_1.01,0.023827199637889863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,64,power_law_1.01,0.025625601410865784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,64,power_law_1.2,0.023680000007152556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,64,power_law_1.2,0.02542720139026642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,8,balanced,0.02720533311367035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,8,balanced,0.02735999971628189
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,8,power_law_1.01,0.03878400027751923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,8,power_law_1.01,0.04305280148983002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,8,power_law_1.2,0.03356159925460815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,1,8,power_law_1.2,0.03454720079898834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,2,1,balanced,0.03345066557327906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,2,1,balanced,0.03547733277082443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,2,1,power_law_1.01,0.036575999855995175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,2,1,power_law_1.01,0.03702400028705597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,2,1,power_law_1.2,0.03723520040512085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,2,1,power_law_1.2,0.03797760009765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,4,1,balanced,0.029167999823888142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,4,1,balanced,0.029482667644818623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,4,1,power_law_1.01,0.027577599883079527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,4,1,power_law_1.01,0.02778240144252777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,4,1,power_law_1.2,0.028255999088287354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,4,1,power_law_1.2,0.029254400730133058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,8,1,balanced,0.0273333340883255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,8,1,balanced,0.029445332785447437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,8,1,power_law_1.01,0.027327999472618103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,8,1,power_law_1.01,0.027340799570083618
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,8,1,power_law_1.2,0.026412799954414368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,4096,1536,8,128,8,1,power_law_1.2,0.027596798539161683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,1,balanced,0.12781332929929098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,1,balanced,0.12788266936937967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,1,power_law_1.01,0.11094399690628051
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,1,power_law_1.01,0.11541119813919068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,1,power_law_1.2,0.09948800206184387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,1,power_law_1.2,0.1058303952217102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,2,balanced,0.0783733328183492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,2,balanced,0.08060266574223836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,2,power_law_1.01,0.0822655975818634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,2,power_law_1.01,0.09476479887962341
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,2,power_law_1.2,0.06938239932060242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,2,power_law_1.2,0.07329919934272766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,4,balanced,0.0558240016301473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,4,balanced,0.055871998270352684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,4,power_law_1.01,0.066975998878479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,4,power_law_1.01,0.07357439994812012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,4,power_law_1.2,0.06000000238418579
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,4,power_law_1.2,0.0639360010623932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,8,balanced,0.054602667689323425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,8,balanced,0.05606933434804281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,8,power_law_1.01,0.05315200090408325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,8,power_law_1.01,0.05414400100708008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,8,power_law_1.2,0.05414400100708008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,1,8,power_law_1.2,0.05432959794998169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,16,1,balanced,0.02735999971628189
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,16,1,balanced,0.027984000742435455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,16,1,power_law_1.01,0.02773759961128235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,16,1,power_law_1.01,0.02805120050907135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,16,1,power_law_1.2,0.026662400364875792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,16,1,power_law_1.2,0.02852480113506317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,2,1,balanced,0.07825600107510884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,2,1,balanced,0.07999466856320699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,2,1,power_law_1.01,0.06903039813041686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,2,1,power_law_1.01,0.07059199810028076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,2,1,power_law_1.2,0.06600319743156433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,2,1,power_law_1.2,0.06640639901161194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,32,1,balanced,0.02712533374627431
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,32,1,balanced,0.029370665550231934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,32,1,power_law_1.01,0.026815998554229736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,32,1,power_law_1.01,0.027577599883079527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,32,1,power_law_1.2,0.0255295991897583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,32,1,power_law_1.2,0.025887998938560485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,4,1,balanced,0.05444799860318502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,4,1,balanced,0.05584533512592316
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,4,1,power_law_1.01,0.04752640128135681
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,4,1,power_law_1.01,0.05203199982643127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,4,1,power_law_1.2,0.047603198885917665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,4,1,power_law_1.2,0.04832000136375427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,8,1,balanced,0.035616000493367515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,8,1,balanced,0.035674666364987694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,8,1,power_law_1.01,0.031404799222946166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,8,1,power_law_1.01,0.031974399089813234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,8,1,power_law_1.2,0.031385600566864014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,16384,2,8,8,1,power_law_1.2,0.03344640135765076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,1,balanced,0.07653333246707916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,1,balanced,0.07820799946784973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,1,power_law_1.01,0.07434239983558655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,1,power_law_1.01,0.07576320171356202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,1,power_law_1.2,0.07596160173416137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,1,power_law_1.2,0.07624959945678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,128,balanced,0.027477333943049114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,128,balanced,0.02749866743882497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,128,power_law_1.01,0.02595199942588806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,128,power_law_1.01,0.02805120050907135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,128,power_law_1.2,0.02595199942588806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,128,power_law_1.2,0.026636800169944762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,16,balanced,0.029391999046007793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,16,balanced,0.03028800090154012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,16,power_law_1.01,0.07418879866600037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,16,power_law_1.01,0.07594239711761475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,16,power_law_1.2,0.07396479845046997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,16,power_law_1.2,0.07541120052337646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,2,balanced,0.05366399884223938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,2,balanced,0.05390933156013489
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,2,power_law_1.01,0.07511039972305297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,2,power_law_1.01,0.07578240036964416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,2,power_law_1.2,0.07345920205116271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,2,power_law_1.2,0.07556480169296265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,256,balanced,0.02740799884001414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,256,balanced,0.02752533306678136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,256,power_law_1.01,0.025472000241279602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,256,power_law_1.01,0.027372801303863527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,256,power_law_1.2,0.02558079957962036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,256,power_law_1.2,0.02590720057487488
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,32,balanced,0.027717334528764088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,32,balanced,0.029493334392706554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,32,power_law_1.01,0.05135359764099121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,32,power_law_1.01,0.05183359980583191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,32,power_law_1.2,0.051737600564956666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,32,power_law_1.2,0.05246719717979431
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,4,balanced,0.03369066615899404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,4,balanced,0.035536001125971474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,4,power_law_1.01,0.0760703980922699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,4,power_law_1.01,0.07607679963111877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,4,power_law_1.2,0.07409279942512512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,4,power_law_1.2,0.07472000122070313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,64,balanced,0.029322666426499683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,64,balanced,0.029450667401154835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,64,power_law_1.01,0.03200640082359314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,64,power_law_1.01,0.032025599479675294
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,64,power_law_1.2,0.030675199627876282
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,64,power_law_1.2,0.032927998900413515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,8,balanced,0.029498666524887085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,8,balanced,0.02976000060637792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,8,power_law_1.01,0.0750976026058197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,8,power_law_1.01,0.0754751980304718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,8,power_law_1.2,0.07311360239982605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,1,8,power_law_1.2,0.07428479790687562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,16,1,balanced,0.02945599953333537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,16,1,balanced,0.02959999938805898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,16,1,power_law_1.01,0.027897599339485168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,16,1,power_law_1.01,0.028064000606536865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,16,1,power_law_1.2,0.02807680070400238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,16,1,power_law_1.2,0.029785600304603577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,2,1,balanced,0.05420800050099691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,2,1,balanced,0.05427733560403188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,2,1,power_law_1.01,0.051974397897720334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,2,1,power_law_1.01,0.053260797262191774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,2,1,power_law_1.2,0.05281919836997986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,2,1,power_law_1.2,0.0538752019405365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,32,1,balanced,0.029146666328112285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,32,1,balanced,0.029232000311215717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,32,1,power_law_1.01,0.027724799513816834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,32,1,power_law_1.01,0.02802560031414032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,32,1,power_law_1.2,0.02746880054473877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,32,1,power_law_1.2,0.028064000606536865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,4,1,balanced,0.03550933301448822
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,4,1,balanced,0.035589332381884255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,4,1,power_law_1.01,0.031046399474143983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,4,1,power_law_1.01,0.033580800890922545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,4,1,power_law_1.2,0.03110400140285492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,4,1,power_law_1.2,0.031699201464653014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,8,1,balanced,0.029919999341169994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,8,1,balanced,0.03150933235883713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,8,1,power_law_1.01,0.02842240035533905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,8,1,power_law_1.01,0.030246400833129884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,8,1,power_law_1.2,0.02805759906768799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2048,8,256,8,1,power_law_1.2,0.028217598795890808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,1,balanced,0.08893332878748576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,1,balanced,0.08987733721733093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,1,power_law_1.01,0.08654720187187195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,1,power_law_1.01,0.08809599876403809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,1,power_law_1.2,0.08814719915390015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,1,power_law_1.2,0.08859519958496094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,16,balanced,0.029088000456492107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,16,balanced,0.029680001238981884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,16,power_law_1.01,0.0642687976360321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,16,power_law_1.01,0.0661952018737793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,16,power_law_1.2,0.05919359922409058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,16,power_law_1.2,0.06059520244598389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,2,balanced,0.0613919993241628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,2,balanced,0.06241600215435028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,2,power_law_1.01,0.08368639945983887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,2,power_law_1.01,0.08580480217933655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,2,power_law_1.2,0.07466239929199218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,2,power_law_1.2,0.07496960163116455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,32,balanced,0.02943466603755951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,32,balanced,0.029616000751654308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,32,power_law_1.01,0.046988800168037415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,32,power_law_1.01,0.04780159890651703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,32,power_law_1.2,0.045977601408958436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,32,power_law_1.2,0.0469760000705719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,4,balanced,0.0407679999868075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,4,balanced,0.04137066751718521
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,4,power_law_1.01,0.07988479733467102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,4,power_law_1.01,0.08108159899711609
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,4,power_law_1.2,0.06707839965820313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,4,power_law_1.2,0.07200000286102295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,8,balanced,0.02939733366171519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,8,balanced,0.029717333614826202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,8,power_law_1.01,0.07694720029830933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,8,power_law_1.01,0.08025599718093872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,8,power_law_1.2,0.06458240151405334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,1,8,power_law_1.2,0.06803839802742004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,2,1,balanced,0.06197333335876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,2,1,balanced,0.06232533355553945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,2,1,power_law_1.01,0.060601598024368285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,2,1,power_law_1.01,0.060787200927734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,2,1,power_law_1.2,0.061312001943588254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,2,1,power_law_1.2,0.061945599317550656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,4,1,balanced,0.04491200049718221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,4,1,balanced,0.045109331607818604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,4,1,power_law_1.01,0.04384639859199524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,4,1,power_law_1.01,0.044300800561904906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,4,1,power_law_1.2,0.04436480104923248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,4,1,power_law_1.2,0.0451200008392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,8,1,balanced,0.030229332546393078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,8,1,balanced,0.03133866687615713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,8,1,power_law_1.01,0.02913280129432678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,8,1,power_law_1.01,0.029811200499534608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,8,1,power_law_1.2,0.03142400085926056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,6144,2560,8,160,8,1,power_law_1.2,0.03164800107479095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,1,balanced,0.08515733480453491
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,1,balanced,0.0865760048230489
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,1,power_law_1.01,0.08225280046463013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,1,power_law_1.01,0.08462719917297364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,1,power_law_1.2,0.08282880187034607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,1,power_law_1.2,0.0838271975517273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,128,balanced,0.029498666524887085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,128,balanced,0.0295413335164388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,128,power_law_1.01,0.027379199862480164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,128,power_law_1.01,0.0281792014837265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,128,power_law_1.2,0.027526399493217467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,128,power_law_1.2,0.029228800535202028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,16,balanced,0.02920000006755193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,16,balanced,0.0308693324526151
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,16,power_law_1.01,0.08428800106048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,16,power_law_1.01,0.08453760147094727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,16,power_law_1.2,0.07912319898605347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,16,power_law_1.2,0.08459519743919372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,2,balanced,0.05799466868241628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,2,balanced,0.05819733440876007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,2,power_law_1.01,0.08416640162467956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,2,power_law_1.01,0.08440319895744323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,2,power_law_1.2,0.08124799728393554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,2,power_law_1.2,0.08170239925384522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,256,balanced,0.027456000447273254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,256,balanced,0.027727998793125153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,256,power_law_1.01,0.025939199328422546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,256,power_law_1.01,0.02789120078086853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,256,power_law_1.2,0.027136000990867614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,256,power_law_1.2,0.02805759906768799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,32,balanced,0.029466666281223297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,32,balanced,0.029477333029111225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,32,power_law_1.01,0.05505920052528381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,32,power_law_1.01,0.05631999969482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,32,power_law_1.2,0.05500800013542175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,32,power_law_1.2,0.056908798217773435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,4,balanced,0.03728000074625015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,4,balanced,0.037871999045213066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,4,power_law_1.01,0.08325759768486023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,4,power_law_1.01,0.08467199802398681
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,4,power_law_1.2,0.08363519906997681
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,4,power_law_1.2,0.08403840065002441
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,64,balanced,0.029498666524887085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,64,balanced,0.031231999397277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,64,power_law_1.01,0.03542400002479553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,64,power_law_1.01,0.03587839901447296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,64,power_law_1.2,0.035129600763320924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,64,power_law_1.2,0.037036800384521486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,8,balanced,0.029509333272775013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,8,balanced,0.02956799914439519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,8,power_law_1.01,0.08312960267066956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,8,power_law_1.01,0.08435840010643006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,8,power_law_1.2,0.08246399760246277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,1,8,power_law_1.2,0.08314239978790283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,16,1,balanced,0.03092266619205475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,16,1,balanced,0.03145600110292435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,16,1,power_law_1.01,0.02922239899635315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,16,1,power_law_1.01,0.030847999453544616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,16,1,power_law_1.2,0.029158401489257812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,16,1,power_law_1.2,0.030559998750686646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,2,1,balanced,0.056890666484832764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,2,1,balanced,0.05942933261394501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,2,1,power_law_1.01,0.05677440166473389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,2,1,power_law_1.01,0.057017600536346434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,2,1,power_law_1.2,0.05632640123367309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,2,1,power_law_1.2,0.0574400007724762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,32,1,balanced,0.031311998764673867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,32,1,balanced,0.032298666735490165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,32,1,power_law_1.01,0.02892799973487854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,32,1,power_law_1.01,0.030348798632621764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,32,1,power_law_1.2,0.028460800647735596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,32,1,power_law_1.2,0.02858240008354187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,4,1,balanced,0.037104000647862755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,4,1,balanced,0.03997333347797394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,4,1,power_law_1.01,0.03592320084571839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,4,1,power_law_1.01,0.03788160085678101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,4,1,power_law_1.2,0.0348800003528595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,4,1,power_law_1.2,0.03551360070705414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,8,1,balanced,0.03259200106064478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,8,1,balanced,0.03370666752258936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,8,1,power_law_1.01,0.029631999135017396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,8,1,power_law_1.01,0.030444800853729248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,8,1,power_law_1.2,0.02900480031967163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,256,8,1,power_law_1.2,0.0302592009305954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,1,balanced,0.08504533767700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,1,balanced,0.08548800150553386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,1,power_law_1.01,0.08325120210647582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,1,power_law_1.01,0.08335360288619995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,1,power_law_1.2,0.08291199803352356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,1,power_law_1.2,0.08436480164527893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,128,balanced,0.02811199923356374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,128,balanced,0.02939733366171519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,128,power_law_1.01,0.02839680016040802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,128,power_law_1.01,0.029414400458335876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,128,power_law_1.2,0.028934401273727418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,128,power_law_1.2,0.02913280129432678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,16,balanced,0.02922133356332779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,16,balanced,0.0312266672650973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,16,power_law_1.01,0.0826367974281311
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,16,power_law_1.01,0.08320639729499817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,16,power_law_1.2,0.08254719972610473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,16,power_law_1.2,0.08332800269126892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,2,balanced,0.057818666100502014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,2,balanced,0.05786666770776113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,2,power_law_1.01,0.08316799998283386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,2,power_law_1.01,0.08428800106048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,2,power_law_1.2,0.08358399868011475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,2,power_law_1.2,0.08394880294799804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,32,balanced,0.029450667401154835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,32,balanced,0.03127466638882955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,32,power_law_1.01,0.06906239986419678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,32,power_law_1.01,0.07032960057258605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,32,power_law_1.2,0.06912000179290771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,32,power_law_1.2,0.06937599778175355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,4,balanced,0.03339733431736628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,4,balanced,0.035616000493367515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,4,power_law_1.01,0.08399360179901123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,4,power_law_1.01,0.08424959778785705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,4,power_law_1.2,0.08321920037269592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,4,power_law_1.2,0.08370559811592101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,64,balanced,0.029504001140594482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,64,balanced,0.02959466725587845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,64,power_law_1.01,0.050310397148132326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,64,power_law_1.01,0.05063040256500244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,64,power_law_1.2,0.050291198492050174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,64,power_law_1.2,0.05106559991836548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,8,balanced,0.031173333525657654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,8,balanced,0.03164800008138021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,8,power_law_1.01,0.08342400193214417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,8,power_law_1.01,0.08410879969596863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,8,power_law_1.2,0.08354560136795045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,1,8,power_law_1.2,0.08385279774665833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,16,1,balanced,0.03089066594839096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,16,1,balanced,0.03138133386770884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,16,1,power_law_1.01,0.02937600016593933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,16,1,power_law_1.01,0.029446399211883544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,16,1,power_law_1.2,0.030451199412345885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,16,1,power_law_1.2,0.03059839904308319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,2,1,balanced,0.058058664202690125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,2,1,balanced,0.05899199843406677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,2,1,power_law_1.01,0.05624960064888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,2,1,power_law_1.01,0.05681920051574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,2,1,power_law_1.2,0.05740799903869629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,2,1,power_law_1.2,0.05799040198326111
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,32,1,balanced,0.03155199935038885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,32,1,balanced,0.032602667808532715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,32,1,power_law_1.01,0.028972798585891725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,32,1,power_law_1.01,0.02908799946308136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,32,1,power_law_1.2,0.02821120023727417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,32,1,power_law_1.2,0.02876160144805908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,4,1,balanced,0.03772799919048945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,4,1,balanced,0.038389332592487335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,4,1,power_law_1.01,0.03620480000972748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,4,1,power_law_1.01,0.037299200892448425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,4,1,power_law_1.2,0.03555839955806732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,4,1,power_law_1.2,0.03566080033779144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,8,1,balanced,0.031285333136717476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,8,1,balanced,0.03165333221356074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,8,1,power_law_1.01,0.029747200012207032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,8,1,power_law_1.01,0.030265599489212036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,8,1,power_law_1.2,0.030060800909996032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2,7168,2048,8,384,8,1,power_law_1.2,0.031276801228523256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,1,balanced,0.1509866714477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,1,balanced,0.1527253290017446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,1,power_law_1.01,0.17650560140609742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,1,power_law_1.01,0.17741440534591674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,1,power_law_1.2,0.1811903953552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,1,power_law_1.2,0.18929920196533204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,128,balanced,0.04997866849104563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,128,balanced,0.050399998823801674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,128,power_law_1.01,0.05045120120048523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,128,power_law_1.01,0.05063679814338684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,128,power_law_1.2,0.0531391978263855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,128,power_law_1.2,0.05408639907836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,16,balanced,0.05197333296140035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,16,balanced,0.05201066533724467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,16,power_law_1.01,0.05878400206565857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,16,power_law_1.01,0.06042879819869995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,16,power_law_1.2,0.06114559769630432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,16,power_law_1.2,0.06339200139045716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,2,balanced,0.09898133079210918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,2,balanced,0.10188266634941101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,2,power_law_1.01,0.12332160472869873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,2,power_law_1.01,0.13059840202331544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,2,power_law_1.2,0.12529280185699462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,2,power_law_1.2,0.12692480087280272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,32,balanced,0.050442665815353394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,32,balanced,0.05207466582457224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,32,power_law_1.01,0.05541759729385376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,32,power_law_1.01,0.05737599730491638
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,32,power_law_1.2,0.0576960027217865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,32,power_law_1.2,0.059520000219345094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,4,balanced,0.0758240024248759
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,4,balanced,0.07626666625340779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,4,power_law_1.01,0.09102079868316651
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,4,power_law_1.01,0.09155200123786926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,4,power_law_1.2,0.09409279823303222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,4,power_law_1.2,0.09509119987487794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,64,balanced,0.050069332122802734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,64,balanced,0.05136000116666158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,64,power_law_1.01,0.051667201519012454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,64,power_law_1.01,0.05283839702606201
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,64,power_law_1.2,0.05413119792938233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,64,power_law_1.2,0.05457280278205871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,8,balanced,0.05863999823729197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,8,balanced,0.06029333174228668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,8,power_law_1.01,0.06893439888954163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,8,power_law_1.01,0.07361279726028443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,8,power_law_1.2,0.07392640113830566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,1,8,power_law_1.2,0.07474560141563416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,2,1,balanced,0.1086133321126302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,2,1,balanced,0.10970133543014526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,2,1,power_law_1.01,0.12021759748458863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,2,1,power_law_1.01,0.12148480415344239
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,2,1,power_law_1.2,0.12151039838790893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,2,1,power_law_1.2,0.12216320037841796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,4,1,balanced,0.09987200299898784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,4,1,balanced,0.10821866989135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,4,1,power_law_1.01,0.11077760457992554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,4,1,power_law_1.01,0.11977599859237671
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,4,1,power_law_1.2,0.11101440191268921
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,2048,768,8,128,4,1,power_law_1.2,0.11185920238494873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,1,balanced,0.4431146780649821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,1,balanced,0.44698135058085126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,1,power_law_1.01,0.5267519950866699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,1,power_law_1.01,0.5325632095336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,1,power_law_1.2,0.5545472145080567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,1,power_law_1.2,0.5575168132781982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,128,balanced,0.058634668588638306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,128,balanced,0.05931200087070465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,128,power_law_1.01,0.06079360246658325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,128,power_law_1.01,0.06297600269317627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,128,power_law_1.2,0.06563839912414551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,128,power_law_1.2,0.06589440107345582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,16,balanced,0.08760000268618266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,16,balanced,0.08852799733479817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,16,power_law_1.01,0.09459840059280396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,16,power_law_1.01,0.09578239917755127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,16,power_law_1.2,0.09634559750556945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,16,power_law_1.2,0.0981760025024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,2,balanced,0.21967466672261557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,2,balanced,0.22051199277242026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,2,power_law_1.01,0.2527359962463379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,2,power_law_1.01,0.25793280601501467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,2,power_law_1.2,0.2671231985092163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,2,power_law_1.2,0.2682496070861816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,256,balanced,0.058575997749964394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,256,balanced,0.05866133173306783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,256,power_law_1.01,0.05852159857749939
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,256,power_law_1.01,0.0588096022605896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,256,power_law_1.2,0.061900800466537474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,256,power_law_1.2,0.06199679970741272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,32,balanced,0.07271466652552287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,32,balanced,0.07398400207360585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,32,power_law_1.01,0.08030719757080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,32,power_law_1.01,0.08044160008430482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,32,power_law_1.2,0.0824832022190094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,32,power_law_1.2,0.08284800052642823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,4,balanced,0.16262400150299072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,4,balanced,0.1632319986820221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,4,power_law_1.01,0.1756608009338379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,4,power_law_1.01,0.18996479511260986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,4,power_law_1.2,0.19759999513626098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,4,power_law_1.2,0.2231231927871704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,64,balanced,0.060122668743133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,64,balanced,0.062074666221936546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,64,power_law_1.01,0.0680895984172821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,64,power_law_1.01,0.06918399930000305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,64,power_law_1.2,0.07015680074691773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,64,power_law_1.2,0.07349759936332703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,8,balanced,0.1116480032602946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,8,balanced,0.11243733763694763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,8,power_law_1.01,0.1170240044593811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,8,power_law_1.01,0.11845120191574096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,8,power_law_1.2,0.12269439697265624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,1,8,power_law_1.2,0.12661759853363036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,2,1,balanced,0.2751839955647786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,2,1,balanced,0.27771733204523724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,2,1,power_law_1.01,0.31950719356536866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,2,1,power_law_1.01,0.3208832025527954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,2,1,power_law_1.2,0.33263359069824217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,2,1,power_law_1.2,0.3356031894683838
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,4,1,balanced,0.19366933902104697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,4,1,balanced,0.19435733556747437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,4,1,power_law_1.01,0.2179647922515869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,4,1,power_law_1.01,0.21926400661468506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,4,1,power_law_1.2,0.2223423957824707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,4,1,power_law_1.2,0.22295680046081542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,8,1,balanced,0.15824533502260843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,8,1,balanced,0.15843733151753744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,8,1,power_law_1.01,0.1692352056503296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,8,1,power_law_1.01,0.16948479413986206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,8,1,power_law_1.2,0.17170560359954834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,3072,1536,8,256,8,1,power_law_1.2,0.17260160446166992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,1,balanced,0.4612480004628499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,1,balanced,0.4665439923604329
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,1,power_law_1.01,0.5341375827789306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,1,power_law_1.01,0.5607808113098145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,1,power_law_1.2,0.5183743953704834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,1,power_law_1.2,0.5274687767028808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,2,balanced,0.2683839996655782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,2,balanced,0.27190399169921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,2,power_law_1.01,0.36980481147766114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,2,power_law_1.01,0.38996479511260984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,2,power_law_1.2,0.38156800270080565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,2,power_law_1.2,0.4232128143310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,4,balanced,0.17204799254735312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,4,balanced,0.17350399494171143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,4,power_law_1.01,0.28845438957214353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,4,power_law_1.01,0.29745280742645264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,4,power_law_1.2,0.27317759990692136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,4,power_law_1.2,0.30349440574645997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,8,balanced,0.12063466509183247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,8,balanced,0.12134400010108948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,8,power_law_1.01,0.24992001056671143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,8,power_law_1.01,0.25073919296264646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,8,power_law_1.2,0.2576319932937622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,1,8,power_law_1.2,0.2589888095855713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,16,1,balanced,0.09714133540789287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,16,1,balanced,0.09782933195432027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,16,1,power_law_1.01,0.09920639991760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,16,1,power_law_1.01,0.09959679841995239
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,16,1,power_law_1.2,0.09934719800949096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,16,1,power_law_1.2,0.10043519735336304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,2,1,balanced,0.26360533634821576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,2,1,balanced,0.26367467641830444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,2,1,power_law_1.01,0.30076160430908205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,2,1,power_law_1.01,0.32419838905334475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,2,1,power_law_1.2,0.2877568006515503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,2,1,power_law_1.2,0.2910271883010864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,32,1,balanced,0.08473599950472514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,32,1,balanced,0.08693333466847737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,32,1,power_law_1.01,0.08707839846611024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,32,1,power_law_1.01,0.08746240139007569
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,32,1,power_law_1.2,0.08532480001449586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,32,1,power_law_1.2,0.08551040291786194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,4,1,balanced,0.17055465777715048
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,4,1,balanced,0.1707520087560018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,4,1,power_law_1.01,0.18197760581970215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,4,1,power_law_1.01,0.19027199745178222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,4,1,power_law_1.2,0.18498560190200805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,4,1,power_law_1.2,0.20051839351654052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,8,1,balanced,0.12131200234095256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,8,1,balanced,0.12357333302497864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,8,1,power_law_1.01,0.1270784020423889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,8,1,power_law_1.01,0.12932480573654176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,8,1,power_law_1.2,0.12343039512634277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,14336,2,8,8,1,power_law_1.2,0.12464640140533448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,1,balanced,0.36717867851257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,1,balanced,0.3683946530024211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,1,power_law_1.01,0.43904638290405273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,1,power_law_1.01,0.4397183895111084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,1,power_law_1.2,0.4505152225494385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,1,power_law_1.2,0.45131521224975585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,128,balanced,0.06624533236026764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,128,balanced,0.06640000144640605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,128,power_law_1.01,0.0722495973110199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,128,power_law_1.01,0.07236480116844177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,128,power_law_1.2,0.07951359748840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,128,power_law_1.2,0.08300799727439881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,16,balanced,0.08746133248011272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,16,balanced,0.08752000331878662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,16,power_law_1.01,0.10028159618377686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,16,power_law_1.01,0.1028223991394043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,16,power_law_1.2,0.11096320152282715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,16,power_law_1.2,0.11370879411697388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,2,balanced,0.19711466630299887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,2,balanced,0.1981066664059957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,2,power_law_1.01,0.23848960399627686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,2,power_law_1.01,0.25289599895477294
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,2,power_law_1.2,0.2563136100769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,2,power_law_1.2,0.2695359945297241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,32,balanced,0.07317333420117696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,32,balanced,0.07422400017579396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,32,power_law_1.01,0.08739200234413147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,32,power_law_1.01,0.092985600233078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,32,power_law_1.2,0.09779840111732482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,32,power_law_1.2,0.09802240133285522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,4,balanced,0.13708800077438354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,4,balanced,0.13807466626167297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,4,power_law_1.01,0.1701696038246155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,4,power_law_1.01,0.1729856014251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,4,power_law_1.2,0.18346879482269288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,4,power_law_1.2,0.19546879529953004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,64,balanced,0.06649599969387054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,64,balanced,0.06745600203673045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,64,power_law_1.01,0.07728000283241272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,64,power_law_1.01,0.08077440261840821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,64,power_law_1.2,0.08478720188140869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,64,power_law_1.2,0.08860160112380981
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,8,balanced,0.10474133491516113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,8,balanced,0.1051680048306783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,8,power_law_1.01,0.12494720220565796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,8,power_law_1.01,0.12522239685058595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,8,power_law_1.2,0.13058559894561766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,1,8,power_law_1.2,0.13432320356369018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,2,1,balanced,0.2504693269729614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,2,1,balanced,0.25142399470011395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,2,1,power_law_1.01,0.28768000602722166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,2,1,power_law_1.01,0.2883968114852905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,2,1,power_law_1.2,0.2946687936782837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,2,1,power_law_1.2,0.2952320098876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,4,1,balanced,0.17705066998799643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,4,1,balanced,0.17890665928522745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,4,1,power_law_1.01,0.19306880235671997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,4,1,power_law_1.01,0.19557119607925416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,4,1,power_law_1.2,0.19667199850082398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,4,1,power_law_1.2,0.19722239971160888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,8,1,balanced,0.16565866271654764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,8,1,balanced,0.16607999801635742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,8,1,power_law_1.01,0.1831104040145874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,8,1,power_law_1.01,0.18486399650573732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,8,1,power_law_1.2,0.18455679416656495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,4096,1536,8,128,8,1,power_law_1.2,0.18655359745025635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,1,balanced,0.8621066411336263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,1,balanced,0.8657386302947998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,1,power_law_1.01,0.9666624069213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,1,power_law_1.01,0.9896575927734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,1,power_law_1.2,0.9427007675170899
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,1,power_law_1.2,0.9933952331542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,2,balanced,0.454581340154012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,2,balanced,0.45470933119455975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,2,power_law_1.01,0.6592319965362549
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,2,power_law_1.01,0.7007616043090821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,2,power_law_1.2,0.5799744129180908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,2,power_law_1.2,0.6673920154571533
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,4,balanced,0.26031466325124103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,4,balanced,0.26106133063634235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,4,power_law_1.01,0.481766414642334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,4,power_law_1.01,0.4824960231781006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,4,power_law_1.2,0.5065855979919434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,4,power_law_1.2,0.5701119899749756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,8,balanced,0.17299199104309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,8,balanced,0.17525867621103922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,8,power_law_1.01,0.38719360828399657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,8,power_law_1.01,0.40407681465148926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,8,power_law_1.2,0.4252799987792969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,1,8,power_law_1.2,0.4299776077270508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,16,1,balanced,0.1288266678651174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,16,1,balanced,0.13006933530171713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,16,1,power_law_1.01,0.1292415976524353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,16,1,power_law_1.01,0.13062399625778198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,16,1,power_law_1.2,0.13151999711990356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,16,1,power_law_1.2,0.13493119478225707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,2,1,balanced,0.4017653465270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,2,1,balanced,0.4026399850845337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,2,1,power_law_1.01,0.48439040184021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,2,1,power_law_1.01,0.4958399772644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,2,1,power_law_1.2,0.46474242210388184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,2,1,power_law_1.2,0.4681087970733643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,32,1,balanced,0.10929600397745769
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,32,1,balanced,0.1095306674639384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,32,1,power_law_1.01,0.10944000482559205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,32,1,power_law_1.01,0.11141760349273681
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,32,1,power_law_1.2,0.11079679727554322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,32,1,power_law_1.2,0.11378560066223145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,4,1,balanced,0.24462399880091348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,4,1,balanced,0.2464639941851298
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,4,1,power_law_1.01,0.27806079387664795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,4,1,power_law_1.01,0.2797055959701538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,4,1,power_law_1.2,0.27280640602111816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,4,1,power_law_1.2,0.276364803314209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,8,1,balanced,0.16827199856440225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,8,1,balanced,0.16854933897654215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,8,1,power_law_1.01,0.18184959888458252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,8,1,power_law_1.01,0.1923840045928955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,8,1,power_law_1.2,0.1838912010192871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,16384,2,8,8,1,power_law_1.2,0.18925440311431885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,1,balanced,1.0867839654286702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,1,balanced,1.0916852951049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,1,power_law_1.01,1.3119935989379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,1,power_law_1.01,1.3279359817504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,1,power_law_1.2,1.373459243774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,1,power_law_1.2,1.3735487937927247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,128,balanced,0.09332799911499023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,128,balanced,0.09525866309801738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,128,power_law_1.01,0.10376960039138794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,128,power_law_1.01,0.10543999671936036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,128,power_law_1.2,0.10815999507904053
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,128,power_law_1.2,0.1093567967414856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,16,balanced,0.148117333650589
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,16,balanced,0.14839999874432883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,16,power_law_1.01,0.15865600109100342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,16,power_law_1.01,0.16064000129699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,16,power_law_1.2,0.16773120164871216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,16,power_law_1.2,0.17658239603042603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,2,balanced,0.5013386805852255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,2,balanced,0.5024533271789551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,2,power_law_1.01,0.6100671768188477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,2,power_law_1.01,0.6228032112121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,2,power_law_1.2,0.6425343990325928
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,2,power_law_1.2,0.6427519798278809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,256,balanced,0.08480000495910645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,256,balanced,0.08692800005276997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,256,power_law_1.01,0.09446399807929992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,256,power_law_1.01,0.09484800100326538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,256,power_law_1.2,0.10158079862594604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,256,power_law_1.2,0.10269440412521362
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,32,balanced,0.11961600184440613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,32,balanced,0.11962133646011353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,32,power_law_1.01,0.12991360425949097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,32,power_law_1.01,0.13096319437026976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,32,power_law_1.2,0.13713279962539673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,32,power_law_1.2,0.1427199959754944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,4,balanced,0.3370026747385661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,4,balanced,0.3417066733042399
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,4,power_law_1.01,0.3606719970703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,4,power_law_1.01,0.36240639686584475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,4,power_law_1.2,0.422214412689209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,4,power_law_1.2,0.42554240226745604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,64,balanced,0.10297066966692607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,64,balanced,0.103301336367925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,64,power_law_1.01,0.10971519947052003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,64,power_law_1.01,0.11169279813766479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,64,power_law_1.2,0.11889280080795288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,64,power_law_1.2,0.1223296046257019
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,8,balanced,0.2046133279800415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,8,balanced,0.20562666654586792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,8,power_law_1.01,0.2226560115814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,8,power_law_1.01,0.23092479705810548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,8,power_law_1.2,0.23381121158599855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,1,8,power_law_1.2,0.2403968095779419
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,16,1,balanced,0.24543466170628866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,16,1,balanced,0.24643200635910034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,16,1,power_law_1.01,0.27331840991973877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,16,1,power_law_1.01,0.27358720302581785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,16,1,power_law_1.2,0.27447679042816164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,16,1,power_law_1.2,0.2753472089767456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,2,1,balanced,0.6041973431905111
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,2,1,balanced,0.6058773199717203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,2,1,power_law_1.01,0.7083903789520264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,2,1,power_law_1.01,0.7090176105499267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,2,1,power_law_1.2,0.7404799938201905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,2,1,power_law_1.2,0.7428160190582276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,32,1,balanced,0.22646933794021606
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,32,1,balanced,0.22800532976786295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,32,1,power_law_1.01,0.24749441146850587
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,32,1,power_law_1.01,0.2488447904586792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,32,1,power_law_1.2,0.24968318939208983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,32,1,power_law_1.2,0.2506047964096069
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,4,1,balanced,0.39019731680552167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,4,1,balanced,0.39057600498199463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,4,1,power_law_1.01,0.4393727779388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,4,1,power_law_1.01,0.4406464099884033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,4,1,power_law_1.2,0.4593023777008057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,4,1,power_law_1.2,0.45999999046325685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,8,1,balanced,0.28734399875005084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,8,1,balanced,0.28757333755493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,8,1,power_law_1.01,0.32127358913421633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,8,1,power_law_1.01,0.3213567972183228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,8,1,power_law_1.2,0.32778880596160886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2048,8,256,8,1,power_law_1.2,0.32856318950653074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,1,balanced,1.016821304957072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,1,balanced,1.0677653153737385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,1,power_law_1.01,1.0937664031982421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,1,power_law_1.01,1.0987135887145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,1,power_law_1.2,1.113868808746338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,1,power_law_1.2,1.1172287940979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,16,balanced,0.13398399949073792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,16,balanced,0.1356053352355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,16,power_law_1.01,0.16621439456939696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,16,power_law_1.01,0.17578879594802857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,16,power_law_1.2,0.18099839687347413
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,16,power_law_1.2,0.1839359998703003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,2,balanced,0.49378665288289386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,2,balanced,0.49696532885233563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,2,power_law_1.01,0.6010496139526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,2,power_law_1.01,0.6271615982055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,2,power_law_1.2,0.6255616188049317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,2,power_law_1.2,0.62773118019104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,32,balanced,0.11358933647473653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,32,balanced,0.11457600196202596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,32,power_law_1.01,0.13626240491867064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,32,power_law_1.01,0.13780479431152343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,32,power_law_1.2,0.15231360197067262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,32,power_law_1.2,0.15252480506896973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,4,balanced,0.26080000400543213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,4,balanced,0.2609386642773946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,4,power_law_1.01,0.33892478942871096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,4,power_law_1.01,0.36894080638885496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,4,power_law_1.2,0.3998528003692627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,4,power_law_1.2,0.41047039031982424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,8,balanced,0.1792853275934855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,8,balanced,0.17993066708246866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,8,power_law_1.01,0.21929600238800048
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,8,power_law_1.01,0.22519679069519044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,8,power_law_1.2,0.23875839710235597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,1,8,power_law_1.2,0.24754559993743896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,2,1,balanced,0.5656799872716268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,2,1,balanced,0.5889600118001302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,2,1,power_law_1.01,0.6251584053039551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,2,1,power_law_1.01,0.6288640022277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,2,1,power_law_1.2,0.6430079936981201
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,2,1,power_law_1.2,0.6555007934570313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,4,1,balanced,0.40990400314331055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,4,1,balanced,0.42867199579874676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,4,1,power_law_1.01,0.41707520484924315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,4,1,power_law_1.01,0.41826558113098145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,4,1,power_law_1.2,0.4267136096954346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,4,1,power_law_1.2,0.4282048225402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,8,1,balanced,0.2801813284556071
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,8,1,balanced,0.29305599133173627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,8,1,power_law_1.01,0.29427199363708495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,8,1,power_law_1.01,0.2943487882614136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,8,1,power_law_1.2,0.3019903898239136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,6144,2560,8,160,8,1,power_law_1.2,0.3046976089477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,1,balanced,1.2561279932657878
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,1,balanced,1.2838079929351807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,1,power_law_1.01,1.5242560386657715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,1,power_law_1.01,1.5376255989074707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,1,power_law_1.2,1.6019136428833007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,1,power_law_1.2,1.6163455963134765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,128,balanced,0.10531199971834819
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,128,balanced,0.10551466544469197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,128,power_law_1.01,0.11438080072402954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,128,power_law_1.01,0.11604479551315308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,128,power_law_1.2,0.11969280242919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,128,power_law_1.2,0.12407040596008301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,16,balanced,0.16576000054677328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,16,balanced,0.16703999042510986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,16,power_law_1.01,0.18362879753112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,16,power_law_1.01,0.18994560241699218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,16,power_law_1.2,0.19809919595718384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,16,power_law_1.2,0.20087039470672607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,2,balanced,0.5829919974009196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,2,balanced,0.5838079849878947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,2,power_law_1.01,0.6946559906005859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,2,power_law_1.01,0.7158912181854248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,2,power_law_1.2,0.7425856113433837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,2,power_law_1.2,0.7462016105651855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,256,balanced,0.0997920036315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,256,balanced,0.10073066751162212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,256,power_law_1.01,0.10429439544677735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,256,power_law_1.01,0.1060096025466919
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,256,power_law_1.2,0.11304320096969604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,256,power_law_1.2,0.11404160261154175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,32,balanced,0.1359946628411611
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,32,balanced,0.13733866810798645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,32,power_law_1.01,0.14315520524978637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,32,power_law_1.01,0.14590079784393312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,32,power_law_1.2,0.15537279844284058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,32,power_law_1.2,0.1585088014602661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,4,balanced,0.38942933082580566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,4,balanced,0.3965919812520345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,4,power_law_1.01,0.44364161491394044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,4,power_law_1.01,0.4463615894317627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,4,power_law_1.2,0.46437759399414064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,4,power_law_1.2,0.5084864139556885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,64,balanced,0.11686399579048157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,64,balanced,0.1179146667321523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,64,power_law_1.01,0.1278720021247864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,64,power_law_1.01,0.12997119426727294
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,64,power_law_1.2,0.13502720594406128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,64,power_law_1.2,0.13897600173950195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,8,balanced,0.233514666557312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,8,balanced,0.23465599616368613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,8,power_law_1.01,0.25655040740966795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,8,power_law_1.01,0.26256000995635986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,8,power_law_1.2,0.2843712091445923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,1,8,power_law_1.2,0.2856575965881348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,16,1,balanced,0.2821439901987712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,16,1,balanced,0.28260799249013263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,16,1,power_law_1.01,0.31217920780181885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,16,1,power_law_1.01,0.3126336097717285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,16,1,power_law_1.2,0.31789441108703614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,16,1,power_law_1.2,0.3181119918823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,2,1,balanced,0.7024373213450114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,2,1,balanced,0.7030080159505209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,2,1,power_law_1.01,0.8277824401855469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,2,1,power_law_1.01,0.8373056411743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,2,1,power_law_1.2,0.8605055809020996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,2,1,power_law_1.2,0.8607616424560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,32,1,balanced,0.2601919968922933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,32,1,balanced,0.260917325814565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,32,1,power_law_1.01,0.2849855899810791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,32,1,power_law_1.01,0.28568320274353026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,32,1,power_law_1.2,0.287718391418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,32,1,power_law_1.2,0.2882303953170776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,4,1,balanced,0.45076266924540204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,4,1,balanced,0.45262932777404785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,4,1,power_law_1.01,0.5130815982818604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,4,1,power_law_1.01,0.5132160186767578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,4,1,power_law_1.2,0.5273983955383301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,4,1,power_law_1.2,0.5274496078491211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,8,1,balanced,0.3322880069414775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,8,1,balanced,0.3325653274854024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,8,1,power_law_1.01,0.3695807933807373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,8,1,power_law_1.01,0.36990718841552733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,8,1,power_law_1.2,0.3772671937942505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,256,8,1,power_law_1.2,0.3780607938766479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,1,balanced,1.837056001027425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,1,balanced,1.8933013280232747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,1,power_law_1.01,1.8016767501831055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,1,power_law_1.01,1.8061376571655274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,1,power_law_1.2,1.9316991806030273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,1,power_law_1.2,1.9344959259033203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,128,balanced,0.10946666200955708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,128,balanced,0.10948266585667928
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,128,power_law_1.01,0.11606400012969971
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,128,power_law_1.01,0.11626880168914795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,128,power_law_1.2,0.11805440187454223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,128,power_law_1.2,0.12195199728012085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,16,balanced,0.19890666007995605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,16,balanced,0.2049973408381144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,16,power_law_1.01,0.2020479917526245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,16,power_law_1.01,0.20602879524230958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,16,power_law_1.2,0.22176640033721923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,16,power_law_1.2,0.22184960842132567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,2,balanced,0.821557362874349
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,2,balanced,0.8243093490600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,2,power_law_1.01,0.8807552337646485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,2,power_law_1.01,0.8944512367248535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,2,power_law_1.2,0.9182527542114258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,2,power_law_1.2,0.922265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,32,balanced,0.15016000469525656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,32,balanced,0.15106133619944254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,32,power_law_1.01,0.15245440006256103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,32,power_law_1.01,0.1610368013381958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,32,power_law_1.2,0.16339839696884156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,32,power_law_1.2,0.16574079990386964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,4,balanced,0.8808586597442627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,4,balanced,0.9141653378804525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,4,power_law_1.01,0.5648320198059082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,4,power_law_1.01,0.6743680000305176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,4,power_law_1.2,0.6054912090301514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,4,power_law_1.2,0.6206912040710449
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,64,balanced,0.12745066483815512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,64,balanced,0.12786666552225748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,64,power_law_1.01,0.12921600341796874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,64,power_law_1.01,0.13111040592193604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,64,power_law_1.2,0.13473279476165773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,64,power_law_1.2,0.13598079681396485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,8,balanced,0.2969599962234497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,8,balanced,0.2990880012512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,8,power_law_1.01,0.30583040714263915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,8,power_law_1.01,0.3216768026351929
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,8,power_law_1.2,0.32436480522155764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,1,8,power_law_1.2,0.32617599964141847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,16,1,balanced,0.34827733039855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,16,1,balanced,0.3490080038706462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,16,1,power_law_1.01,0.3398144006729126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,16,1,power_law_1.01,0.3405440092086792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,16,1,power_law_1.2,0.3466559886932373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,16,1,power_law_1.2,0.34679040908813474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,2,1,balanced,0.9672160148620605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,2,1,balanced,0.9842773278554281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,2,1,power_law_1.01,0.9573568344116211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,2,1,power_law_1.01,0.9661312103271484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,2,1,power_law_1.2,0.9974207878112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,2,1,power_law_1.2,1.0001536369323731
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,32,1,balanced,0.3157599965731303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,32,1,balanced,0.3162986636161804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,32,1,power_law_1.01,0.30661759376525877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,32,1,power_law_1.01,0.30808320045471194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,32,1,power_law_1.2,0.3129983901977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,32,1,power_law_1.2,0.3150784015655518
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,4,1,balanced,0.5936319828033447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,4,1,balanced,0.5942293405532837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,4,1,power_law_1.01,0.5764671802520752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,4,1,power_law_1.01,0.5778624057769776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,4,1,power_law_1.2,0.5987840175628663
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,4,1,power_law_1.2,0.6006336212158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,8,1,balanced,0.4192639986673991
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,8,1,balanced,0.4203786849975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,8,1,power_law_1.01,0.4042496204376221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,8,1,power_law_1.01,0.4066880226135254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,8,1,power_law_1.2,0.42096638679504395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,2048,7168,2048,8,384,8,1,power_law_1.2,0.42116479873657225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,1,balanced,0.09641599655151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,1,balanced,0.0976106623808543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,1,power_law_1.01,0.10718719959259033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,1,power_law_1.01,0.10729600191116333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,1,power_law_1.2,0.10703359842300415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,1,power_law_1.2,0.10758399963378906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,128,balanced,0.03540800015131632
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,128,balanced,0.03668266783157984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,128,power_law_1.01,0.03478400111198425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,128,power_law_1.01,0.03540480136871338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,128,power_law_1.2,0.03459199965000152
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,128,power_law_1.2,0.034643200039863584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,16,balanced,0.041946664452552795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,16,balanced,0.04241600135962168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,16,power_law_1.01,0.038431999087333676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,16,power_law_1.01,0.039212799072265624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,16,power_law_1.2,0.037254399061203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,16,power_law_1.2,0.03944959938526153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,2,balanced,0.0601440022389094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,2,balanced,0.06026133398214976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,2,power_law_1.01,0.06165760159492493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,2,power_law_1.01,0.06260480284690857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,2,power_law_1.2,0.06306560039520263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,2,power_law_1.2,0.06399999856948853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,32,balanced,0.037685332198937736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,32,balanced,0.03773866593837738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,32,power_law_1.01,0.036236798763275145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,32,power_law_1.01,0.0365119993686676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,32,power_law_1.2,0.03521920144557953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,32,power_law_1.2,0.03586559891700745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,4,balanced,0.042965332667032875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,4,balanced,0.043840001026789345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,4,power_law_1.01,0.04501760005950928
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,4,power_law_1.01,0.04614399969577789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,4,power_law_1.2,0.04390400052070618
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,4,power_law_1.2,0.04627200067043304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,64,balanced,0.0360000009338061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,64,balanced,0.03743999948104223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,64,power_law_1.01,0.035488000512123107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,64,power_law_1.01,0.0361407995223999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,64,power_law_1.2,0.03500800132751465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,64,power_law_1.2,0.035411199927330016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,8,balanced,0.03748800108830134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,8,balanced,0.03773866593837738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,8,power_law_1.01,0.03619199991226196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,8,power_law_1.01,0.03682560026645661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,8,power_law_1.2,0.037478399276733396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,1,8,power_law_1.2,0.03768959939479828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,2,1,balanced,0.0681333343187968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,2,1,balanced,0.06891733407974243
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,2,1,power_law_1.01,0.0732479989528656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,2,1,power_law_1.01,0.07343999743461609
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,2,1,power_law_1.2,0.0720255970954895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,2,1,power_law_1.2,0.07320320010185241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,4,1,balanced,0.056143999099731445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,4,1,balanced,0.05929600199063619
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,4,1,power_law_1.01,0.05870720148086548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,4,1,power_law_1.01,0.060761600732803345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,4,1,power_law_1.2,0.06021760106086731
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,2048,768,8,128,4,1,power_law_1.2,0.060550397634506224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,1,balanced,0.32076799869537354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,1,balanced,0.32174400488535565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,1,power_law_1.01,0.29825921058654786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,1,power_law_1.01,0.30033919811248777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,1,power_law_1.2,0.3109823942184448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,1,power_law_1.2,0.31789441108703614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,128,balanced,0.0401706670721372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,128,balanced,0.04022933294375738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,128,power_law_1.01,0.0383103996515274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,128,power_law_1.01,0.038950398564338684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,128,power_law_1.2,0.0381632000207901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,128,power_law_1.2,0.03847039937973022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,16,balanced,0.06412266691525777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,16,balanced,0.06824533144632976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,16,power_law_1.01,0.05728639960289002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,16,power_law_1.01,0.05788159966468811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,16,power_law_1.2,0.05377920269966126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,16,power_law_1.2,0.055270397663116456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,2,balanced,0.1777706742286682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,2,balanced,0.17889066537221274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,2,power_law_1.01,0.1739840030670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,2,power_law_1.01,0.17724159955978394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,2,power_law_1.2,0.1729151964187622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,2,power_law_1.2,0.17550079822540282
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,256,balanced,0.03978666663169861
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,256,balanced,0.03986666599909464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,256,power_law_1.01,0.03802880048751831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,256,power_law_1.01,0.0381056010723114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,256,power_law_1.2,0.03733119964599609
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,256,power_law_1.2,0.03880960047245026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,32,balanced,0.07367999851703644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,32,balanced,0.07984533409277599
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,32,power_law_1.01,0.06241919994354248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,32,power_law_1.01,0.07244799733161926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,32,power_law_1.2,0.06606079936027527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,32,power_law_1.2,0.06817280054092408
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,4,balanced,0.10753066341082256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,4,balanced,0.10761599739392598
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,4,power_law_1.01,0.10117119550704956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,4,power_law_1.01,0.10376960039138794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,4,power_law_1.2,0.09845119714736938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,4,power_law_1.2,0.09980159997940063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,64,balanced,0.04370133578777313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,64,balanced,0.043951998154322304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,64,power_law_1.01,0.04104959964752197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,64,power_law_1.01,0.041228801012039185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,64,power_law_1.2,0.04111360013484955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,64,power_law_1.2,0.0421887993812561
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,8,balanced,0.07361066838105519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,8,balanced,0.07412800192832947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,8,power_law_1.01,0.06559360027313232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,8,power_law_1.01,0.06899200081825256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,8,power_law_1.2,0.06766080260276794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,1,8,power_law_1.2,0.06875519752502442
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,2,1,balanced,0.1813546617825826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,2,1,balanced,0.1817013422648112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,2,1,power_law_1.01,0.1804927945137024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,2,1,power_law_1.01,0.1820799946784973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,2,1,power_law_1.2,0.1831104040145874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,2,1,power_law_1.2,0.1843135952949524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,4,1,balanced,0.11750400066375732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,4,1,balanced,0.11883733669916789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,4,1,power_law_1.01,0.11433600187301636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,4,1,power_law_1.01,0.11639039516448975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,4,1,power_law_1.2,0.11753599643707276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,4,1,power_law_1.2,0.11920000314712524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,8,1,balanced,0.08681066830952962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,8,1,balanced,0.08825600147247314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,8,1,power_law_1.01,0.09040639996528625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,8,1,power_law_1.01,0.09099519848823548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,8,1,power_law_1.2,0.0914687991142273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,3072,1536,8,256,8,1,power_law_1.2,0.09175040125846863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,1,balanced,0.20055999358495077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,1,balanced,0.2017013430595398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,1,power_law_1.01,0.23137280941009522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,1,power_law_1.01,0.23221120834350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,1,power_law_1.2,0.2327039957046509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,1,power_law_1.2,0.23574399948120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,2,balanced,0.10085866848627727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,2,balanced,0.10147733489672343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,2,power_law_1.01,0.14016640186309814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,2,power_law_1.01,0.14648959636688233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,2,power_law_1.2,0.1291584014892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,2,power_law_1.2,0.13954559564590455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,4,balanced,0.17722133795420328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,4,balanced,0.1820853352546692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,4,power_law_1.01,0.08606719970703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,4,power_law_1.01,0.0866047978401184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,4,power_law_1.2,0.08727040290832519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,4,power_law_1.2,0.11167999505996704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,8,balanced,0.12132267157236735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,8,balanced,0.12918933232625326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,8,power_law_1.01,0.0733568012714386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,8,power_law_1.01,0.07418879866600037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,8,power_law_1.2,0.0754688024520874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,1,8,power_law_1.2,0.07560319900512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,16,1,balanced,0.04159999887148539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,16,1,balanced,0.0417546679576238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,16,1,power_law_1.01,0.043584001064300534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,16,1,power_law_1.01,0.04366720020771027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,16,1,power_law_1.2,0.043161600828170776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,16,1,power_law_1.2,0.04341759979724884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,2,1,balanced,0.11159466703732808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,2,1,balanced,0.1128053367137909
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,2,1,power_law_1.01,0.13036160469055175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,2,1,power_law_1.01,0.13282560110092162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,2,1,power_law_1.2,0.128985595703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,2,1,power_law_1.2,0.1321727991104126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,32,1,balanced,0.0373333344856898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,32,1,balanced,0.03774400055408478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,32,1,power_law_1.01,0.03713279962539673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,32,1,power_law_1.01,0.037376001477241516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,32,1,power_law_1.2,0.0377920001745224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,32,1,power_law_1.2,0.038047999143600464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,4,1,balanced,0.07557866473992665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,4,1,balanced,0.07648533085982005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,4,1,power_law_1.01,0.08102399706840516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,4,1,power_law_1.01,0.08120319843292237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,4,1,power_law_1.2,0.0788096010684967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,4,1,power_law_1.2,0.08026880025863647
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,8,1,balanced,0.057706668972969055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,8,1,balanced,0.058245331048965454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,8,1,power_law_1.01,0.05764480233192444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,8,1,power_law_1.01,0.0576960027217865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,8,1,power_law_1.2,0.05856000185012818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,14336,2,8,8,1,power_law_1.2,0.05906559824943543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,1,balanced,0.2582506736119588
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,1,balanced,0.2593013246854146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,1,power_law_1.01,0.2917248010635376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,1,power_law_1.01,0.2937279939651489
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,1,power_law_1.2,0.30110080242156984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,1,power_law_1.2,0.30439679622650145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,128,balanced,0.04176533222198486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,128,balanced,0.04188266893227895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,128,power_law_1.01,0.03993600010871887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,128,power_law_1.01,0.04044159948825836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,128,power_law_1.2,0.04016000032424927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,128,power_law_1.2,0.04031359851360321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,16,balanced,0.090037335952123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,16,balanced,0.0938933293024699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,16,power_law_1.01,0.06755200028419495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,16,power_law_1.01,0.0753279983997345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,16,power_law_1.2,0.07486720085144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,16,power_law_1.2,0.07988479733467102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,2,balanced,0.13432000080744425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,2,balanced,0.13635200262069702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,2,power_law_1.01,0.14090880155563354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,2,power_law_1.01,0.14099199771881105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,2,power_law_1.2,0.1430848002433777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,2,power_law_1.2,0.14748799800872803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,32,balanced,0.047413334250450134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,32,balanced,0.04780800143877665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,32,power_law_1.01,0.04312959909439087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,32,power_law_1.01,0.0438975989818573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,32,power_law_1.2,0.042982399463653564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,32,power_law_1.2,0.04318720102310181
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,4,balanced,0.08850666880607605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,4,balanced,0.08891733487447102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,4,power_law_1.01,0.08788480162620545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,4,power_law_1.01,0.08790400028228759
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,4,power_law_1.2,0.08963840007781983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,4,power_law_1.2,0.08975359797477722
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,64,balanced,0.043562665581703186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,64,balanced,0.04363733530044556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,64,power_law_1.01,0.040275201201438904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,64,power_law_1.01,0.040940800309181215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,64,power_law_1.2,0.04056960046291351
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,64,power_law_1.2,0.04145280122756958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,8,balanced,0.07025066514809926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,8,balanced,0.0707946668068568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,8,power_law_1.01,0.06385279893875122
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,8,power_law_1.01,0.06681600213050842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,8,power_law_1.2,0.06594560146331788
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,1,8,power_law_1.2,0.06876800060272217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,2,1,balanced,0.16249600052833557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,2,1,balanced,0.1644159952799479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,2,1,power_law_1.01,0.18184319734573365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,2,1,power_law_1.01,0.18201600313186644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,2,1,power_law_1.2,0.18574719429016112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,2,1,power_law_1.2,0.18630399703979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,4,1,balanced,0.10714133580525716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,4,1,balanced,0.10797333717346191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,4,1,power_law_1.01,0.11430399417877198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,4,1,power_law_1.01,0.11520639657974244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,4,1,power_law_1.2,0.11489919424057007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,4,1,power_law_1.2,0.11560319662094116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,8,1,balanced,0.0862559974193573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,8,1,balanced,0.0867146650950114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,8,1,power_law_1.01,0.09067519903182983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,8,1,power_law_1.01,0.091212797164917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,8,1,power_law_1.2,0.09128959774971009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,4096,1536,8,128,8,1,power_law_1.2,0.09207680225372314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,1,balanced,0.39027734597524005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,1,balanced,0.3923146724700928
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,1,power_law_1.01,0.4418496131896973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,1,power_law_1.01,0.4606527805328369
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,1,power_law_1.2,0.45571198463439944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,1,power_law_1.2,0.4661888122558594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,2,balanced,0.15516266226768494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,2,balanced,0.1560640037059784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,2,power_law_1.01,0.221343994140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,2,power_law_1.01,0.223142409324646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,2,power_law_1.2,0.2090751886367798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,2,power_law_1.2,0.217958402633667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,4,balanced,0.2299519975980123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,4,balanced,0.23736000061035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,4,power_law_1.01,0.11921279430389405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,4,power_law_1.01,0.1502079963684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,4,power_law_1.2,0.11679359674453735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,4,power_law_1.2,0.21071360111236573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,8,balanced,0.14589333534240723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,8,balanced,0.14779200156529745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,8,power_law_1.01,0.09455999732017517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,8,power_law_1.01,0.09492480158805847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,8,power_law_1.2,0.09500160217285156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,1,8,power_law_1.2,0.09570559859275818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,16,1,balanced,0.056090667843818665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,16,1,balanced,0.05810666580994924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,16,1,power_law_1.01,0.05907840132713318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,16,1,power_law_1.01,0.06021760106086731
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,16,1,power_law_1.2,0.05984640121459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,16,1,power_law_1.2,0.06030719876289368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,2,1,balanced,0.16660799582799277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,2,1,balanced,0.16702934106191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,2,1,power_law_1.01,0.2013887882232666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,2,1,power_law_1.01,0.20151040554046631
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,2,1,power_law_1.2,0.1992640018463135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,2,1,power_law_1.2,0.20161280632019044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,32,1,balanced,0.04269866645336151
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,32,1,balanced,0.04496000210444132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,32,1,power_law_1.01,0.045158401131629944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,32,1,power_law_1.01,0.046265599131584165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,32,1,power_law_1.2,0.04470399916172028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,32,1,power_law_1.2,0.04499199986457825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,4,1,balanced,0.10495466987291972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,4,1,balanced,0.10571199655532837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,4,1,power_law_1.01,0.11542400121688842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,4,1,power_law_1.01,0.11921279430389405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,4,1,power_law_1.2,0.11746560335159302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,4,1,power_law_1.2,0.11886719465255738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,8,1,balanced,0.07250666618347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,8,1,balanced,0.07327466706434886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,8,1,power_law_1.01,0.07836160063743591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,8,1,power_law_1.01,0.07946239709854126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,8,1,power_law_1.2,0.07880319952964783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,16384,2,8,8,1,power_law_1.2,0.0788927972316742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,1,balanced,0.7910239696502686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,1,balanced,0.7917866706848145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,1,power_law_1.01,0.7608128070831299
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,1,power_law_1.01,0.7627967834472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,1,power_law_1.2,0.7930751800537109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,1,power_law_1.2,0.799955177307129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,128,balanced,0.05309866865475973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,128,balanced,0.05341866612434387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,128,power_law_1.01,0.04881280064582825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,128,power_law_1.01,0.049472001194953916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,128,power_law_1.2,0.04842239916324616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,128,power_law_1.2,0.04976640045642853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,16,balanced,0.11361066500345866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,16,balanced,0.11426132917404175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,16,power_law_1.01,0.0906175971031189
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,16,power_law_1.01,0.09845759868621826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,16,power_law_1.2,0.09516800045967103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,16,power_law_1.2,0.10089600086212158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,2,balanced,0.41513601938883465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,2,balanced,0.4181600014368693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,2,power_law_1.01,0.3989696025848389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,2,power_law_1.01,0.41212158203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,2,power_law_1.2,0.4283711910247803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,2,power_law_1.2,0.4287744045257568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,256,balanced,0.04780800143877665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,256,balanced,0.04794666667779287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,256,power_law_1.01,0.04535039961338043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,256,power_law_1.01,0.045772799849510194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,256,power_law_1.2,0.044838398694992065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,256,power_law_1.2,0.0449535995721817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,32,balanced,0.15421866377194723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,32,balanced,0.164383997519811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,32,power_law_1.01,0.1316159963607788
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,32,power_law_1.01,0.1459712028503418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,32,power_law_1.2,0.11694719791412353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,32,power_law_1.2,0.1311360001564026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,4,balanced,0.23086400826772055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,4,balanced,0.23155200481414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,4,power_law_1.01,0.2071552038192749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,4,power_law_1.01,0.21816959381103515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,4,power_law_1.2,0.21476480960845948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,4,power_law_1.2,0.21850879192352296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,64,balanced,0.06785066425800323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,64,balanced,0.07089599967002869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,64,power_law_1.01,0.061689597368240354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,64,power_law_1.01,0.06308479905128479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,64,power_law_1.2,0.061414402723312375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,64,power_law_1.2,0.06275839805603027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,8,balanced,0.13980799913406372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,8,balanced,0.13992533087730408
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,8,power_law_1.01,0.1259392023086548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,8,power_law_1.01,0.12910079956054688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,8,power_law_1.2,0.12677760124206544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,1,8,power_law_1.2,0.1267840027809143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,16,1,balanced,0.12145066261291504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,16,1,balanced,0.12176533540089925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,16,1,power_law_1.01,0.13210879564285277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,16,1,power_law_1.01,0.1328703999519348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,16,1,power_law_1.2,0.13437440395355224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,16,1,power_law_1.2,0.13578879833221436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,2,1,balanced,0.4221973419189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,2,1,balanced,0.4224693377812703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,2,1,power_law_1.01,0.3999039888381958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,2,1,power_law_1.01,0.4002175807952881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,2,1,power_law_1.2,0.4099775791168213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,2,1,power_law_1.2,0.4108416080474854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,32,1,balanced,0.10322667161623637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,32,1,balanced,0.10355200370152791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,32,1,power_law_1.01,0.11688319444656373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,32,1,power_law_1.01,0.11708159446716308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,32,1,power_law_1.2,0.11771520376205444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,32,1,power_law_1.2,0.11772799491882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,4,1,balanced,0.24055467049280801
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,4,1,balanced,0.24140799045562744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,4,1,power_law_1.01,0.23149440288543702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,4,1,power_law_1.01,0.2319551944732666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,4,1,power_law_1.2,0.23564798831939698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,4,1,power_law_1.2,0.2357503890991211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,8,1,balanced,0.15652267138163248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,8,1,balanced,0.15758400162061056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,8,1,power_law_1.01,0.16190719604492188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,8,1,power_law_1.01,0.16191359758377075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,8,1,power_law_1.2,0.16359039545059204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2048,8,256,8,1,power_law_1.2,0.1639423966407776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,1,balanced,0.7180960178375244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,1,balanced,0.7193706830342611
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,1,power_law_1.01,0.7630527973175049
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,1,power_law_1.01,0.76462721824646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,1,power_law_1.2,0.7921279907226563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,1,power_law_1.2,0.8003456115722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,16,balanced,0.22859734296798706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,16,balanced,0.22914133469263712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,16,power_law_1.01,0.1713536024093628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,16,power_law_1.01,0.18999040126800537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,16,power_law_1.2,0.1474943995475769
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,16,power_law_1.2,0.15431679487228395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,2,balanced,0.3410133520762126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,2,balanced,0.3415306806564331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,2,power_law_1.01,0.33829119205474856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,2,power_law_1.01,0.34703359603881834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,2,power_law_1.2,0.3547840118408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,2,power_law_1.2,0.35935359001159667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,32,balanced,0.09497599800427754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,32,balanced,0.09649599591890971
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,32,power_law_1.01,0.08525440096855164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,32,power_law_1.01,0.08923519849777221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,32,power_law_1.2,0.0827455997467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,32,power_law_1.2,0.08572160005569458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,4,balanced,0.1931999921798706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,4,balanced,0.19329599539438883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,4,power_law_1.01,0.1839359998703003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,4,power_law_1.01,0.18825600147247315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,4,power_law_1.2,0.19111039638519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,4,power_law_1.2,0.19839999675750733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,8,balanced,0.15331199765205383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,8,balanced,0.15946666399637857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,8,power_law_1.01,0.1232640027999878
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,8,power_law_1.01,0.12595200538635254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,8,power_law_1.2,0.13115520477294923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,1,8,power_law_1.2,0.13242239952087403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,2,1,balanced,0.3936479886372884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,2,1,balanced,0.3967573245366414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,2,1,power_law_1.01,0.41347198486328124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,2,1,power_law_1.01,0.42118401527404786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,2,1,power_law_1.2,0.42652158737182616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,2,1,power_law_1.2,0.43155841827392577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,4,1,balanced,0.2506399949391683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,4,1,balanced,0.25093867381413776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,4,1,power_law_1.01,0.25842559337615967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,4,1,power_law_1.01,0.2585536003112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,4,1,power_law_1.2,0.26017920970916747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,4,1,power_law_1.2,0.26067841053009033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,8,1,balanced,0.15421866377194723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,8,1,balanced,0.15516266226768494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,8,1,power_law_1.01,0.15645439624786378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,8,1,power_law_1.01,0.15672320127487183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,8,1,power_law_1.2,0.15828479528427125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,6144,2560,8,160,8,1,power_law_1.2,0.15956480503082277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,1,balanced,0.9190346399943033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,1,balanced,0.9202986558278402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,1,power_law_1.01,0.8821824073791504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,1,power_law_1.01,0.8877823829650879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,1,power_law_1.2,0.9159616470336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,1,power_law_1.2,0.9188544273376464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,128,balanced,0.05806933343410492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,128,balanced,0.05827199916044871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,128,power_law_1.01,0.05297920107841492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,128,power_law_1.01,0.05374720096588135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,128,power_law_1.2,0.05432320237159729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,128,power_law_1.2,0.05443840026855469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,16,balanced,0.1243946651617686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,16,balanced,0.12748799721399942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,16,power_law_1.01,0.1065600037574768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,16,power_law_1.01,0.1100160002708435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,16,power_law_1.2,0.10334080457687378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,16,power_law_1.2,0.10368000268936158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,2,balanced,0.4819413423538208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,2,balanced,0.4825386603673299
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,2,power_law_1.01,0.45735678672790525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,2,power_law_1.01,0.4723199844360352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,2,power_law_1.2,0.4866687774658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,2,power_law_1.2,0.492307186126709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,256,balanced,0.05018133421738943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,256,balanced,0.05097599824269613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,256,power_law_1.01,0.04736000001430511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,256,power_law_1.01,0.04766719937324524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,256,power_law_1.2,0.04769279956817627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,256,power_law_1.2,0.047775998711586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,32,balanced,0.1757919987042745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,32,balanced,0.17622933785120645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,32,power_law_1.01,0.14763519763946534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,32,power_law_1.01,0.15204479694366455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,32,power_law_1.2,0.13237119913101197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,32,power_law_1.2,0.13556480407714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,4,balanced,0.262938658396403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,4,balanced,0.2664480010668437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,4,power_law_1.01,0.23420801162719726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,4,power_law_1.01,0.2359999895095825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,4,power_law_1.2,0.24008960723876954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,4,power_law_1.2,0.2479680061340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,64,balanced,0.0774186650911967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,64,balanced,0.07897066573301952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,64,power_law_1.01,0.06908159852027893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,64,power_law_1.01,0.0720192015171051
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,64,power_law_1.2,0.06823040246963501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,64,power_law_1.2,0.0701312005519867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,8,balanced,0.15774400035540262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,8,balanced,0.15871466199556986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,8,power_law_1.01,0.14320000410079955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,8,power_law_1.01,0.1457535982131958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,8,power_law_1.2,0.14137599468231202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,1,8,power_law_1.2,0.14387199878692628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,16,1,balanced,0.13648533821105957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,16,1,balanced,0.1386666695276896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,16,1,power_law_1.01,0.1498047947883606
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,16,1,power_law_1.01,0.1505344033241272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,16,1,power_law_1.2,0.1520959973335266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,16,1,power_law_1.2,0.15226240158081056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,2,1,balanced,0.48822398980458576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,2,1,balanced,0.48853866259257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,2,1,power_law_1.01,0.4579008102416992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,2,1,power_law_1.01,0.46253437995910646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,2,1,power_law_1.2,0.47185277938842773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,2,1,power_law_1.2,0.4810431957244873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,32,1,balanced,0.11553066968917847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,32,1,balanced,0.1162506639957428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,32,1,power_law_1.01,0.12980480194091798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,32,1,power_law_1.01,0.13162879943847655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,32,1,power_law_1.2,0.1341375946998596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,32,1,power_law_1.2,0.13420159816741944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,4,1,balanced,0.27559467156728107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,4,1,balanced,0.2795253396034241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,4,1,power_law_1.01,0.2681600093841553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,4,1,power_law_1.01,0.26975998878479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,4,1,power_law_1.2,0.27260799407958985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,4,1,power_law_1.2,0.27918078899383547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,8,1,balanced,0.17701866229375204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,8,1,balanced,0.17891732851664224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,8,1,power_law_1.01,0.18227200508117675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,8,1,power_law_1.01,0.18439680337905884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,8,1,power_law_1.2,0.18614399433135986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,256,8,1,power_law_1.2,0.18632960319519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,1,balanced,1.348639965057373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,1,balanced,1.3486453692118328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,1,power_law_1.01,1.1210559844970702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,1,power_law_1.01,1.1406335830688477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,1,power_law_1.2,1.125875186920166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,1,power_law_1.2,1.1461888313293458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,128,balanced,0.06496533254782359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,128,balanced,0.06622933348019917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,128,power_law_1.01,0.06041600108146668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,128,power_law_1.01,0.06304640173912049
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,128,power_law_1.2,0.061414402723312375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,128,power_law_1.2,0.062438398599624634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,16,balanced,0.17735467354456583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,16,balanced,0.1774453322092692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,16,power_law_1.01,0.12341760396957398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,16,power_law_1.01,0.14640640020370482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,16,power_law_1.2,0.12598400115966796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,16,power_law_1.2,0.14071680307388307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,2,balanced,0.6955733299255371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,2,balanced,0.6968373457590739
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,2,power_law_1.01,0.6036479949951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,2,power_law_1.01,0.6078271865844727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,2,power_law_1.2,0.590822410583496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,2,power_law_1.2,0.5992000102996826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,32,balanced,0.264570673306783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,32,balanced,0.2752586603164673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,32,power_law_1.01,0.21304960250854493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,32,power_law_1.01,0.22469120025634765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,32,power_law_1.2,0.19165439605712892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,32,power_law_1.2,0.20298879146575927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,4,balanced,0.37083733081817627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,4,balanced,0.3720586697260539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,4,power_law_1.01,0.29954559803009034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,4,power_law_1.01,0.3155328035354614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,4,power_law_1.2,0.306822395324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,4,power_law_1.2,0.3135488033294678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,64,balanced,0.14441066980361938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,64,balanced,0.14566399653752646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,64,power_law_1.01,0.12149120569229126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,64,power_law_1.01,0.125273597240448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,64,power_law_1.2,0.1020095944404602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,64,power_law_1.2,0.12120959758758545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,8,balanced,0.21368000904719034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,8,balanced,0.21381866931915283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,8,power_law_1.01,0.16927360296249389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,8,power_law_1.01,0.1865023970603943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,8,power_law_1.2,0.1750208020210266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,1,8,power_law_1.2,0.19428479671478271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,16,1,balanced,0.176581343015035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,16,1,balanced,0.17779199282328287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,16,1,power_law_1.01,0.17270400524139404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,16,1,power_law_1.01,0.17482880353927613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,16,1,power_law_1.2,0.17495039701461793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,16,1,power_law_1.2,0.1749824047088623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,2,1,balanced,0.7019840081532797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,2,1,balanced,0.7033387025197347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,2,1,power_law_1.01,0.5908671855926514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,2,1,power_law_1.01,0.595142412185669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,2,1,power_law_1.2,0.5941440105438233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,2,1,power_law_1.2,0.5960447788238525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,32,1,balanced,0.14752533038457236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,32,1,balanced,0.14849600195884705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,32,1,power_law_1.01,0.15192960500717162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,32,1,power_law_1.01,0.15205760002136232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,32,1,power_law_1.2,0.1521407961845398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,32,1,power_law_1.2,0.15319039821624755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,4,1,balanced,0.3845599889755249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,4,1,balanced,0.38472533226013184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,4,1,power_law_1.01,0.33376638889312743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,4,1,power_law_1.01,0.334118390083313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,4,1,power_law_1.2,0.33139839172363283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,4,1,power_law_1.2,0.3351295948028564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,8,1,balanced,0.23573867479960123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,8,1,balanced,0.23603200912475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,8,1,power_law_1.01,0.21758079528808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,8,1,power_law_1.01,0.21825919151306153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,8,1,power_law_1.2,0.21772799491882325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,256,7168,2048,8,384,8,1,power_law_1.2,0.22110719680786134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,1,balanced,0.3009066581726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,1,balanced,0.3033226728439331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,1,power_law_1.01,0.2352447986602783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,1,power_law_1.01,0.2365056037902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,1,power_law_1.2,0.2406912088394165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,1,power_law_1.2,0.24262399673461915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,128,balanced,0.0582239975531896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,128,balanced,0.05863999823729197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,128,power_law_1.01,0.05999360084533691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,128,power_law_1.01,0.060224002599716185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,128,power_law_1.2,0.06599680185317994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,128,power_law_1.2,0.06609920263290406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,16,balanced,0.06599466502666473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,16,balanced,0.06740266581376393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,16,power_law_1.01,0.07394559979438782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,16,power_law_1.01,0.07446399927139283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,16,power_law_1.2,0.08116480112075805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,16,power_law_1.2,0.08495360016822814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,2,balanced,0.15155733625094095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,2,balanced,0.15264532963434854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,2,power_law_1.01,0.15445760488510132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,2,power_law_1.01,0.15991040468215942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,2,power_law_1.2,0.1646463990211487
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,2,power_law_1.2,0.1656767964363098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,32,balanced,0.0602400004863739
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,32,balanced,0.06028800209363302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,32,power_law_1.01,0.06809599995613098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,32,power_law_1.01,0.06952319741249084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,32,power_law_1.2,0.0692736029624939
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,32,power_law_1.2,0.07195519804954528
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,4,balanced,0.10377599795659383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,4,balanced,0.10469866792360942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,4,power_law_1.01,0.11132160425186158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,4,power_law_1.01,0.11701120138168335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,4,power_law_1.2,0.11676160097122193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,4,power_law_1.2,0.12125439643859863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,64,balanced,0.0584853341182073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,64,balanced,0.05881066620349884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,64,power_law_1.01,0.06345599889755249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,64,power_law_1.01,0.06438400149345398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,64,power_law_1.2,0.06661760210990905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,64,power_law_1.2,0.06756479740142822
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,8,balanced,0.07890133559703827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,8,balanced,0.07937066753705342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,8,power_law_1.01,0.09012479782104492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,8,power_law_1.01,0.0948032021522522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,8,power_law_1.2,0.09359999895095825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,1,8,power_law_1.2,0.09760000109672547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,2,1,balanced,0.20040533939997354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,2,1,balanced,0.20048532883326212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,2,1,power_law_1.01,0.1727552056312561
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,2,1,power_law_1.01,0.17555199861526488
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,2,1,power_law_1.2,0.1747007966041565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,2,1,power_law_1.2,0.17555840015411378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,4,1,balanced,0.1649333337942759
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,4,1,balanced,0.16709866126378378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,4,1,power_law_1.01,0.14491519927978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,4,1,power_law_1.01,0.14714239835739135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,4,1,power_law_1.2,0.1467967987060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,2048,768,8,128,4,1,power_law_1.2,0.147161602973938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,1,balanced,0.6265866756439209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,1,balanced,0.6277546485265096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,1,power_law_1.01,0.5450304031372071
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,1,power_law_1.01,0.5502143859863281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,1,power_law_1.2,0.569491195678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,1,power_law_1.2,0.5726592063903808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,128,balanced,0.07025066514809926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,128,balanced,0.07062399884064992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,128,power_law_1.01,0.07793279886245727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,128,power_law_1.01,0.07793920040130616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,128,power_law_1.2,0.0858240008354187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,128,power_law_1.2,0.08728960156440735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,16,balanced,0.10148800412813823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,16,balanced,0.10223999619483948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,16,power_law_1.01,0.11440000534057618
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,16,power_law_1.01,0.11756160259246826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,16,power_law_1.2,0.11979520320892334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,16,power_law_1.2,0.12346240282058715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,2,balanced,0.3234986662864685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,2,balanced,0.3249173363049825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,2,power_law_1.01,0.31617279052734376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,2,power_law_1.01,0.33356800079345705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,2,power_law_1.2,0.34358398914337157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,2,power_law_1.2,0.38226559162139895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,256,balanced,0.0697866678237915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,256,balanced,0.07028266787528992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,256,power_law_1.01,0.0722815990447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,256,power_law_1.01,0.0754368007183075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,256,power_law_1.2,0.07909119725227357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,256,power_law_1.2,0.07995520234107971
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,32,balanced,0.08820799986521403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,32,balanced,0.08949333429336548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,32,power_law_1.01,0.09797760248184204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,32,power_law_1.01,0.09943680167198181
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,32,power_law_1.2,0.10294400453567505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,32,power_law_1.2,0.10730240345001221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,4,balanced,0.16870399316151938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,4,balanced,0.16948266824086508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,4,power_law_1.01,0.21441280841827393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,4,power_law_1.01,0.2147007942199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,4,power_law_1.2,0.21469440460205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,4,power_law_1.2,0.24097280502319335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,64,balanced,0.07306666672229767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,64,balanced,0.07458133498827617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,64,power_law_1.01,0.08731520175933838
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,64,power_law_1.01,0.08946560025215149
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,64,power_law_1.2,0.09388160109519958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,64,power_law_1.2,0.09516800045967103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,8,balanced,0.12576533357302347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,8,balanced,0.1260693371295929
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,8,power_law_1.01,0.14320640563964843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,8,power_law_1.01,0.14431999921798705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,8,power_law_1.2,0.1512063980102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,1,8,power_law_1.2,0.1525887966156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,2,1,balanced,0.397765318552653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,2,1,balanced,0.42371733983357746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,2,1,power_law_1.01,0.34576001167297366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,2,1,power_law_1.01,0.34824318885803224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,2,1,power_law_1.2,0.3592832088470459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,2,1,power_law_1.2,0.3600768089294434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,4,1,balanced,0.25514666239420575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,4,1,balanced,0.26388800144195557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,4,1,power_law_1.01,0.22907519340515137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,4,1,power_law_1.01,0.2295232057571411
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,4,1,power_law_1.2,0.23598079681396483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,4,1,power_law_1.2,0.23606400489807128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,8,1,balanced,0.2244053284327189
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,8,1,balanced,0.22525866826375326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,8,1,power_law_1.01,0.21728639602661132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,8,1,power_law_1.01,0.21881599426269532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,8,1,power_law_1.2,0.21996159553527833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,3072,1536,8,256,8,1,power_law_1.2,0.22181758880615235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,1,balanced,0.6639360189437866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,1,balanced,0.6661760012308756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,1,power_law_1.01,0.7250239849090576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,1,power_law_1.01,0.7351232051849366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,1,power_law_1.2,0.7171711921691895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,1,power_law_1.2,0.7458303928375244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,2,balanced,0.37435734272003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,2,balanced,0.37644267082214355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,2,power_law_1.01,0.4874752044677734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,2,power_law_1.01,0.5554815769195557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,2,power_law_1.2,0.5028736114501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,2,power_law_1.2,0.5341695785522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,4,balanced,0.23152534166971842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,4,balanced,0.23215999205907187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,4,power_law_1.01,0.42005119323730467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,4,power_law_1.01,0.43916797637939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,4,power_law_1.2,0.3807615995407104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,4,power_law_1.2,0.44141440391540526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,8,balanced,0.16536532839139303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,8,balanced,0.1664426624774933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,8,power_law_1.01,0.3368383884429932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,8,power_law_1.01,0.34300799369812013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,8,power_law_1.2,0.34911360740661623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,1,8,power_law_1.2,0.35050880908966064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,16,1,balanced,0.12661866346995035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,16,1,balanced,0.12682132919629416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,16,1,power_law_1.01,0.12923519611358641
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,16,1,power_law_1.01,0.12935680150985718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,16,1,power_law_1.2,0.12723840475082399
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,16,1,power_law_1.2,0.12754559516906738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,2,1,balanced,0.3685866594314575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,2,1,balanced,0.3694560130437215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,2,1,power_law_1.01,0.3981184005737305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,2,1,power_law_1.01,0.417190408706665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,2,1,power_law_1.2,0.39767680168151853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,2,1,power_law_1.2,0.4052544116973877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,32,1,balanced,0.11108799775441487
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,32,1,balanced,0.11120532949765523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,32,1,power_law_1.01,0.11071360111236572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,32,1,power_law_1.01,0.11096320152282715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,32,1,power_law_1.2,0.11122560501098633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,32,1,power_law_1.2,0.11123199462890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,4,1,balanced,0.23148266474405924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,4,1,balanced,0.23354132970174155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,4,1,power_law_1.01,0.24827520847320556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,4,1,power_law_1.01,0.2531327962875366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,4,1,power_law_1.2,0.24484479427337646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,4,1,power_law_1.2,0.25039360523223875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,8,1,balanced,0.1629706621170044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,8,1,balanced,0.1644053359826406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,8,1,power_law_1.01,0.17093759775161743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,8,1,power_law_1.01,0.17158399820327758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,8,1,power_law_1.2,0.16447360515594484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,14336,2,8,8,1,power_law_1.2,0.16813440322875978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,1,balanced,0.9676053524017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,1,balanced,0.9842346509297689
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,1,power_law_1.01,0.5200064182281494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,1,power_law_1.01,0.5207039833068847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,1,power_law_1.2,0.5379007816314697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,1,power_law_1.2,0.5391039848327637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,128,balanced,0.08250133196512859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,128,balanced,0.08277333279450734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,128,power_law_1.01,0.09619839787483216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,128,power_law_1.01,0.10001920461654663
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,128,power_law_1.2,0.11008640527725219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,128,power_law_1.2,0.11298559904098511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,16,balanced,0.1113759974638621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,16,balanced,0.11356266339619954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,16,power_law_1.01,0.13374719619750977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,16,power_law_1.01,0.13870079517364503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,16,power_law_1.2,0.13868800401687623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,16,power_law_1.2,0.14586880207061767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,2,balanced,0.37593599160512287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,2,balanced,0.3760426839192708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,2,power_law_1.01,0.32327680587768554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,2,power_law_1.01,0.3260799884796143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,2,power_law_1.2,0.36768639087677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,2,power_law_1.2,0.3829823970794678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,32,balanced,0.09909866253534953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,32,balanced,0.09939199686050415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,32,power_law_1.01,0.11571199893951416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,32,power_law_1.01,0.11812479496002197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,32,power_law_1.2,0.12522239685058595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,32,power_law_1.2,0.1335744023323059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,4,balanced,0.1811786691347758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,4,balanced,0.18198400735855103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,4,power_law_1.01,0.2082240104675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,4,power_law_1.01,0.21719679832458497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,4,power_law_1.2,0.21818881034851073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,4,power_law_1.2,0.21967999935150145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,64,balanced,0.08741333087285359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,64,balanced,0.08825066685676575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,64,power_law_1.01,0.10305919647216796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,64,power_law_1.01,0.10539519786834717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,64,power_law_1.2,0.11840640306472779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,64,power_law_1.2,0.12092159986495972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,8,balanced,0.13809600472450256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,8,balanced,0.13825600345929465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,8,power_law_1.01,0.15638400316238404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,8,power_law_1.01,0.16248320341110228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,8,power_law_1.2,0.16781439781188964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,1,8,power_law_1.2,0.16874879598617554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,2,1,balanced,0.5537813504536947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,2,1,balanced,0.5552746852238973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,2,1,power_law_1.01,0.32699520587921144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,2,1,power_law_1.01,0.3307584047317505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,2,1,power_law_1.2,0.33695359230041505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,2,1,power_law_1.2,0.3383807897567749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,4,1,balanced,0.363866647084554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,4,1,balanced,0.36713067690531415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,4,1,power_law_1.01,0.252889609336853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,4,1,power_law_1.01,0.29799039363861085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,4,1,power_law_1.2,0.2536767959594727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,4,1,power_law_1.2,0.2539968013763428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,8,1,balanced,0.2920373280843099
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,8,1,balanced,0.2920479973157247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,8,1,power_law_1.01,0.21880319118499755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,8,1,power_law_1.01,0.22195839881896973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,8,1,power_law_1.2,0.22225921154022216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,4096,1536,8,128,8,1,power_law_1.2,0.22831358909606933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,1,balanced,1.2554933230082195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,1,balanced,1.263055960337321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,1,power_law_1.01,1.373971176147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,1,power_law_1.01,1.3924032211303712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,1,power_law_1.2,1.3836095809936524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,1,power_law_1.2,1.4067328453063965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,2,balanced,0.6482186714808146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,2,balanced,0.649237314860026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,2,power_law_1.01,0.8783103942871093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,2,power_law_1.01,0.999846363067627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,2,power_law_1.2,0.902131175994873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,2,power_law_1.2,1.0059391975402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,4,balanced,0.35682666301727295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,4,balanced,0.35972801844278973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,4,power_law_1.01,0.6890304088592529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,4,power_law_1.01,0.7093760013580322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,4,power_law_1.2,0.7910975933074951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,4,power_law_1.2,0.7921664237976074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,8,balanced,0.22817599773406982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,8,balanced,0.2295466661453247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,8,power_law_1.01,0.5329279899597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,8,power_law_1.01,0.5893760204315186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,8,power_law_1.2,0.5901823997497558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,1,8,power_law_1.2,0.6231040000915528
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,16,1,balanced,0.17775466044743857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,16,1,balanced,0.17781867583592734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,16,1,power_law_1.01,0.1833024024963379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,16,1,power_law_1.01,0.18391679525375365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,16,1,power_law_1.2,0.18097280263900756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,16,1,power_law_1.2,0.18165119886398315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,2,1,balanced,0.5763786633809408
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,2,1,balanced,0.5778666734695435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,2,1,power_law_1.01,0.6339456081390381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,2,1,power_law_1.01,0.6715839862823486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,2,1,power_law_1.2,0.6177599906921387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,2,1,power_law_1.2,0.6319168090820313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,32,1,balanced,0.14853333433469137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,32,1,balanced,0.14890666802724203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,32,1,power_law_1.01,0.14999040365219116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,32,1,power_law_1.01,0.1513152003288269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,32,1,power_law_1.2,0.14937599897384643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,32,1,power_law_1.2,0.1502400040626526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,4,1,balanced,0.3442026774088542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,4,1,balanced,0.3455040057500203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,4,1,power_law_1.01,0.3773567914962769
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,4,1,power_law_1.01,0.3890752077102661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,4,1,power_law_1.2,0.3769344091415405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,4,1,power_law_1.2,0.38246400356292726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,8,1,balanced,0.2368533412615458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,8,1,balanced,0.2368746598561605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,8,1,power_law_1.01,0.24819839000701904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,8,1,power_law_1.01,0.24913280010223388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,8,1,power_law_1.2,0.25180160999298096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,16384,2,8,8,1,power_law_1.2,0.25363199710845946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,1,balanced,1.4706346193949382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,1,balanced,1.5283360481262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,1,power_law_1.01,1.3393856048583985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,1,power_law_1.01,1.3763327598571777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,1,power_law_1.2,1.4011648178100586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,1,power_law_1.2,1.4160767555236817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,128,balanced,0.12103466192881267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,128,balanced,0.12206400434176128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,128,power_law_1.01,0.13251199722290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,128,power_law_1.01,0.13392640352249147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,128,power_law_1.2,0.14455679655075074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,128,power_law_1.2,0.14512640237808228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,16,balanced,0.1736533244450887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,16,balanced,0.17482666174570718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,16,power_law_1.01,0.19912320375442505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,16,power_law_1.01,0.20051200389862062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,16,power_law_1.2,0.22120959758758546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,16,power_law_1.2,0.22410240173339843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,2,balanced,0.6813066800435384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,2,balanced,0.6921813488006592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,2,power_law_1.01,0.7431359767913819
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,2,power_law_1.01,0.772051191329956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,2,power_law_1.2,0.7599232196807861
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,2,power_law_1.2,0.7878143787384033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,256,balanced,0.11932800213495891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,256,balanced,0.11961600184440613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,256,power_law_1.01,0.12704639434814452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,256,power_law_1.01,0.1283903956413269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,256,power_law_1.2,0.13631999492645264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,256,power_law_1.2,0.14232959747314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,32,balanced,0.14468800028165182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,32,balanced,0.1460693379243215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,32,power_law_1.01,0.1640768051147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,32,power_law_1.01,0.16981120109558107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,32,power_law_1.2,0.17173759937286376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,32,power_law_1.2,0.17271679639816284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,4,balanced,0.33719468116760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,4,balanced,0.3393973509470622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,4,power_law_1.01,0.4265535831451416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,4,power_law_1.01,0.4395264148712158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,4,power_law_1.2,0.469817590713501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,4,power_law_1.2,0.5150400161743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,64,balanced,0.12800533572832742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,64,balanced,0.13015466928482056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,64,power_law_1.01,0.14320000410079955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,64,power_law_1.01,0.14445439577102662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,64,power_law_1.2,0.1565440058708191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,64,power_law_1.2,0.1603008031845093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,8,balanced,0.22617065906524658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,8,balanced,0.22850133975346884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,8,power_law_1.01,0.26791679859161377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,8,power_law_1.01,0.27209599018096925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,8,power_law_1.2,0.2992703914642334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,1,8,power_law_1.2,0.3070847988128662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,16,1,balanced,0.33669865131378174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,16,1,balanced,0.38365864753723145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,16,1,power_law_1.01,0.33563520908355715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,16,1,power_law_1.01,0.3370944023132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,16,1,power_law_1.2,0.3418303966522217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,16,1,power_law_1.2,0.3668800115585327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,2,1,balanced,0.793941338857015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,2,1,balanced,0.7980266412099203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,2,1,power_law_1.01,0.7663296222686767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,2,1,power_law_1.01,0.7669951915740967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,2,1,power_law_1.2,0.7954624176025391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,2,1,power_law_1.2,0.803718376159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,32,1,balanced,0.341050664583842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,32,1,balanced,0.3598986864089966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,32,1,power_law_1.01,0.352454400062561
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,32,1,power_law_1.01,0.3930943965911865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,32,1,power_law_1.2,0.35688960552215576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,32,1,power_law_1.2,0.361023998260498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,4,1,balanced,0.4928853511810303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,4,1,balanced,0.4949546655019124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,4,1,power_law_1.01,0.46983041763305666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,4,1,power_law_1.01,0.47097601890563967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,4,1,power_law_1.2,0.4869696140289307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,4,1,power_law_1.2,0.4899903774261475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,8,1,balanced,0.38209601243336994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,8,1,balanced,0.43221867084503174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,8,1,power_law_1.01,0.37175679206848145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,8,1,power_law_1.01,0.3740992069244385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,8,1,power_law_1.2,0.3814912080764771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2048,8,256,8,1,power_law_1.2,0.3819648027420044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,1,balanced,3.084693272908529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,1,balanced,3.153301239013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,1,power_law_1.01,1.2755264282226562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,1,power_law_1.01,1.2852352142333985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,1,power_law_1.2,1.3612352371215821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,1,power_law_1.2,1.385862445831299
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,16,balanced,0.1834026575088501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,16,balanced,0.18412800629933676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,16,power_law_1.01,0.21404800415039063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,16,power_law_1.01,0.23112959861755372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,16,power_law_1.2,0.24343678951263428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,16,power_law_1.2,0.249017596244812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,2,balanced,1.2183466752370198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,2,balanced,1.220922629038493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,2,power_law_1.01,0.691212797164917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,2,power_law_1.01,0.7555583953857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,2,power_law_1.2,0.7982848167419434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,2,power_law_1.2,0.8523391723632813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,32,balanced,0.14778133233388266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,32,balanced,0.14858133594195047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,32,power_law_1.01,0.1824447989463806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,32,power_law_1.01,0.18736000061035157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,32,power_law_1.2,0.18913919925689698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,32,power_law_1.2,0.20524799823760986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,4,balanced,0.38342400391896564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,4,balanced,0.38545068105061847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,4,power_law_1.01,0.4387392044067383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,4,power_law_1.01,0.4643712043762207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,4,power_law_1.2,0.4948416233062744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,4,power_law_1.2,0.5112895965576172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,8,balanced,0.251525342464447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,8,balanced,0.2585546573003133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,8,power_law_1.01,0.2946687936782837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,8,power_law_1.01,0.3040064096450806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,8,power_law_1.2,0.3147455930709839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,1,8,power_law_1.2,0.3253887891769409
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,2,1,balanced,1.6318079630533855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,2,1,balanced,1.6435200373331706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,2,1,power_law_1.01,0.7188159942626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,2,1,power_law_1.01,0.7353343963623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,2,1,power_law_1.2,0.7427199840545654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,2,1,power_law_1.2,0.7578559875488281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,4,1,balanced,0.9323146343231201
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,4,1,balanced,0.9366186459859213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,4,1,power_law_1.01,0.4598656177520752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,4,1,power_law_1.01,0.4599423885345459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,4,1,power_law_1.2,0.46574721336364744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,4,1,power_law_1.2,0.47208318710327146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,8,1,balanced,0.6545600096384684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,8,1,balanced,0.663973331451416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,8,1,power_law_1.01,0.3632128000259399
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,8,1,power_law_1.01,0.3646784067153931
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,8,1,power_law_1.2,0.36595840454101564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,6144,2560,8,160,8,1,power_law_1.2,0.3729856014251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,1,balanced,1.6397013664245605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,1,balanced,1.6997440656026204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,1,power_law_1.01,1.585420799255371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,1,power_law_1.01,1.6016191482543944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,1,power_law_1.2,1.6470527648925781
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,1,power_law_1.2,1.6626623153686524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,128,balanced,0.13588800032933554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,128,balanced,0.13595733046531677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,128,power_law_1.01,0.15032960176467897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,128,power_law_1.01,0.15096960067749024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,128,power_law_1.2,0.16238720417022706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,128,power_law_1.2,0.16736639738082887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,16,balanced,0.19637866814931235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,16,balanced,0.19710934162139893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,16,power_law_1.01,0.23118081092834472
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,16,power_law_1.01,0.235916805267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,16,power_law_1.2,0.24552319049835206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,16,power_law_1.2,0.2613055944442749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,2,balanced,0.7655359903971354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,2,balanced,0.7705706755320231
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,2,power_law_1.01,0.8300095558166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,2,power_law_1.01,0.8533056259155274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,2,power_law_1.2,0.8735936164855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,2,power_law_1.2,0.8862015724182128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,256,balanced,0.13396799564361572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,256,balanced,0.1341973344484965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,256,power_law_1.01,0.14287999868392945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,256,power_law_1.01,0.143340802192688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,256,power_law_1.2,0.1565951943397522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,256,power_law_1.2,0.15820800065994262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,32,balanced,0.16289599736531576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,32,balanced,0.16379200418790182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,32,power_law_1.01,0.18913279771804808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,32,power_law_1.01,0.18926719427108765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,32,power_law_1.2,0.20730879306793212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,32,power_law_1.2,0.21473278999328613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,4,balanced,0.3890186548233032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,4,balanced,0.3898346821467082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,4,power_law_1.01,0.5059711933135986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,4,power_law_1.01,0.5283135890960693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,4,power_law_1.2,0.5355584144592285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,4,power_law_1.2,0.5603519916534424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,64,balanced,0.1469119985898336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,64,balanced,0.14851733048756918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,64,power_law_1.01,0.1647487998008728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,64,power_law_1.01,0.1666111946105957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,64,power_law_1.2,0.17998720407485963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,64,power_law_1.2,0.18021759986877442
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,8,balanced,0.2595413327217102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,8,balanced,0.2602720061937968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,8,power_law_1.01,0.32039680480957033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,8,power_law_1.01,0.3240000009536743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,8,power_law_1.2,0.34037759304046633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,1,8,power_law_1.2,0.35973761081695554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,16,1,balanced,0.38543999195098877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,16,1,balanced,0.4119093418121338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,16,1,power_law_1.01,0.38755838871002196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,16,1,power_law_1.01,0.4166912078857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,16,1,power_law_1.2,0.3908031940460205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,16,1,power_law_1.2,0.3941504001617432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,2,1,balanced,0.8857279618581136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,2,1,balanced,0.8888746897379557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,2,1,power_law_1.01,0.889798355102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,2,1,power_law_1.01,0.9074943542480469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,2,1,power_law_1.2,0.9284223556518555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,2,1,power_law_1.2,0.9304639816284179
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,32,1,balanced,0.3903520107269287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,32,1,balanced,0.3911093473434448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,32,1,power_law_1.01,0.40210561752319335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,32,1,power_law_1.01,0.403718376159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,32,1,power_law_1.2,0.43060479164123533
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,32,1,power_law_1.2,0.4486976146697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,4,1,balanced,0.5561279853185018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,4,1,balanced,0.5585653384526571
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,4,1,power_law_1.01,0.5417727947235107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,4,1,power_law_1.01,0.5501567840576171
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,4,1,power_law_1.2,0.5663424015045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,4,1,power_law_1.2,0.5705088138580322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,8,1,balanced,0.43538133303324383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,8,1,balanced,0.4375786781311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,8,1,power_law_1.01,0.4314752101898193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,8,1,power_law_1.01,0.43410558700561525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,8,1,power_law_1.2,0.44425601959228517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,256,8,1,power_law_1.2,0.4447296142578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,1,balanced,1.9105706214904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,1,balanced,2.0247467358907065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,1,power_law_1.01,2.2520383834838866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,1,power_law_1.01,2.2963008880615234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,1,power_law_1.2,2.3643264770507812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,1,power_law_1.2,2.3840255737304688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,128,balanced,0.13828266660372415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,128,balanced,0.14136000474294028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,128,power_law_1.01,0.151910400390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,128,power_law_1.01,0.1523200035095215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,128,power_law_1.2,0.16213760375976563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,128,power_law_1.2,0.16421120166778563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,16,balanced,0.23001599311828613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,16,balanced,0.23003733158111572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,16,power_law_1.01,0.24924159049987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,16,power_law_1.01,0.25226879119873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,16,power_law_1.2,0.2807487964630127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,16,power_law_1.2,0.28612480163574217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,2,balanced,0.8628586928049723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,2,balanced,0.8629493713378906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,2,power_law_1.01,1.0258943557739257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,2,power_law_1.01,1.0390527725219727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,2,power_law_1.2,1.1056575775146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,2,power_law_1.2,1.1119487762451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,32,balanced,0.1785279909769694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,32,balanced,0.18002132574717203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,32,power_law_1.01,0.19443199634552003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,32,power_law_1.01,0.19642239809036255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,32,power_law_1.2,0.21276800632476806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,32,power_law_1.2,0.21742079257965088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,4,balanced,0.5574826796849569
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,4,balanced,0.5655200084050497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,4,power_law_1.01,0.626803207397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,4,power_law_1.01,0.6663936138153076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,4,power_law_1.2,0.6232192039489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,4,power_law_1.2,0.6759871959686279
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,64,balanced,0.1569813291231791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,64,balanced,0.15710933009783426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,64,power_law_1.01,0.16482559442520142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,64,power_law_1.01,0.16966400146484376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,64,power_law_1.2,0.18083839416503905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,64,power_law_1.2,0.18190720081329345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,8,balanced,0.3269173304239909
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,8,balanced,0.32901867230733234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,8,power_law_1.01,0.35320320129394533
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,8,power_law_1.01,0.35694079399108886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,8,power_law_1.2,0.3859519958496094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,1,8,power_law_1.2,0.39108479022979736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,16,1,balanced,0.40987201531728107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,16,1,balanced,0.4122026761372884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,16,1,power_law_1.01,0.45187201499938967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,16,1,power_law_1.01,0.4521599769592285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,16,1,power_law_1.2,0.4571648120880127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,16,1,power_law_1.2,0.4580416202545166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,2,1,balanced,1.0422933101654053
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,2,1,balanced,1.0619466304779053
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,2,1,power_law_1.01,1.2213760375976563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,2,1,power_law_1.01,1.2306943893432618
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,2,1,power_law_1.2,1.2619008064270019
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,2,1,power_law_1.2,1.2666751861572265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,32,1,balanced,0.3778880039850871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,32,1,balanced,0.3792213201522827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,32,1,power_law_1.01,0.4112959861755371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,32,1,power_law_1.01,0.4118015766143799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,32,1,power_law_1.2,0.4159423828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,32,1,power_law_1.2,0.4165952205657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,4,1,balanced,0.6597066720326742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,4,1,balanced,0.6603039900461832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,4,1,power_law_1.01,0.7447807788848877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,4,1,power_law_1.01,0.7455808162689209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,4,1,power_law_1.2,0.7768832206726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,4,1,power_law_1.2,0.7818751811981202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,8,1,balanced,0.4848159948984782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,8,1,balanced,0.48531198501586914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,8,1,power_law_1.01,0.5345983982086182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,8,1,power_law_1.01,0.5353087902069091
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,8,1,power_law_1.2,0.547711992263794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,3072,7168,2048,8,384,8,1,power_law_1.2,0.551468801498413
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,1,balanced,0.08122133215268452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,1,balanced,0.0814879983663559
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,1,power_law_1.01,0.07166720032691956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,1,power_law_1.01,0.07170559763908387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,1,power_law_1.2,0.06899200081825256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,1,power_law_1.2,0.07045120000839233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,128,balanced,0.033413333197434746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,128,balanced,0.033471999069054924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,128,power_law_1.01,0.03129599988460541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,128,power_law_1.01,0.03226880133152008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,128,power_law_1.2,0.030656000971794127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,128,power_law_1.2,0.03139199912548065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,16,balanced,0.02826666583617528
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,16,balanced,0.029306667546431225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,16,power_law_1.01,0.026579201221466064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,16,power_law_1.01,0.026771199703216553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,16,power_law_1.2,0.026841598749160766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,16,power_law_1.2,0.02720000147819519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,2,balanced,0.05604266623655955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,2,balanced,0.057429333527882896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,2,power_law_1.01,0.05129600167274475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,2,power_law_1.01,0.051846402883529666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,2,power_law_1.2,0.05052800178527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,2,power_law_1.2,0.05289599895477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,32,balanced,0.029359998802344005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,32,balanced,0.029626667499542236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,32,power_law_1.01,0.02752000093460083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,32,power_law_1.01,0.02770560085773468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,32,power_law_1.2,0.026092800498008727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,32,power_law_1.2,0.026668798923492432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,4,balanced,0.036042665441830955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,4,balanced,0.03741333385308584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,4,power_law_1.01,0.03338240087032318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,4,power_law_1.01,0.03461120128631592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,4,power_law_1.2,0.03235200047492981
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,4,power_law_1.2,0.033529600501060484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,64,balanced,0.027349332968393963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,64,balanced,0.029578665892283123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,64,power_law_1.01,0.026099199056625368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,64,power_law_1.01,0.02775680124759674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,64,power_law_1.2,0.026310399174690247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,64,power_law_1.2,0.026425600051879883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,8,balanced,0.0314026673634847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,8,balanced,0.031514666974544525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,8,power_law_1.01,0.028518399596214293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,8,power_law_1.01,0.02871040105819702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,8,power_law_1.2,0.02932479977607727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,1,8,power_law_1.2,0.029478400945663452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,2,1,balanced,0.05841066439946493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,2,1,balanced,0.06010133524735769
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,2,1,power_law_1.01,0.0515392005443573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,2,1,power_law_1.01,0.052767997980117796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,2,1,power_law_1.2,0.050547200441360476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,2,1,power_law_1.2,0.05120000243186951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,4,1,balanced,0.03979199876387914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,4,1,balanced,0.039813332259655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,4,1,power_law_1.01,0.03581439852714539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,4,1,power_law_1.01,0.036083200573921205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,4,1,power_law_1.2,0.03670400083065033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,2048,768,8,128,4,1,power_law_1.2,0.03683840036392212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,1,balanced,0.3078933358192444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,1,balanced,0.30938132603963214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,1,power_law_1.01,0.1716863989830017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,1,power_law_1.01,0.1727679967880249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,1,power_law_1.2,0.15982719659805297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,1,power_law_1.2,0.1609984040260315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,128,balanced,0.029472000896930695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,128,balanced,0.029685333371162415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,128,power_law_1.01,0.028249600529670717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,128,power_law_1.01,0.028569599986076354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,128,power_law_1.2,0.027820798754692077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,128,power_law_1.2,0.028531199693679808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,16,balanced,0.04896533489227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,16,balanced,0.05009600023428599
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,16,power_law_1.01,0.03975679874420166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,16,power_law_1.01,0.04312320053577423
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,16,power_law_1.2,0.03934719860553741
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,16,power_law_1.2,0.042444801330566405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,2,balanced,0.17060265938440958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,2,balanced,0.17125332355499268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,2,power_law_1.01,0.10374399423599243
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,2,power_law_1.01,0.11006720066070556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,2,power_law_1.2,0.10241279602050782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,2,power_law_1.2,0.10846079587936401
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,256,balanced,0.03579733272393545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,256,balanced,0.03612799942493439
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,256,power_law_1.01,0.033030399680137636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,256,power_law_1.01,0.03411200046539307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,256,power_law_1.2,0.03299199938774109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,256,power_law_1.2,0.03381119966506958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,32,balanced,0.03355200091997782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,32,balanced,0.033557333052158356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,32,power_law_1.01,0.029414400458335876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,32,power_law_1.01,0.030534398555755616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,32,power_law_1.2,0.029504001140594482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,32,power_law_1.2,0.030067199468612672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,4,balanced,0.10218133529027303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,4,balanced,0.10270933310190837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,4,power_law_1.01,0.07780479788780212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,4,power_law_1.01,0.08586879968643188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,4,power_law_1.2,0.07504640221595764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,4,power_law_1.2,0.07685760259628296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,64,balanced,0.03133333226044973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,64,balanced,0.03143466760714849
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,64,power_law_1.01,0.02927359938621521
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,64,power_law_1.01,0.031244799494743347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,64,power_law_1.2,0.02910720109939575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,64,power_law_1.2,0.030060800909996032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,8,balanced,0.06744533280531566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,8,balanced,0.0682239979505539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,8,power_law_1.01,0.05475199818611145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,8,power_law_1.01,0.06074240207672119
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,8,power_law_1.2,0.055315202474594115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,1,8,power_law_1.2,0.05980799794197082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,2,1,balanced,0.17421332995096842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,2,1,balanced,0.17527467012405396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,2,1,power_law_1.01,0.10266879796981812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,2,1,power_law_1.01,0.10502400398254394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,2,1,power_law_1.2,0.09749119877815246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,2,1,power_law_1.2,0.09764479994773864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,4,1,balanced,0.10854400197664897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,4,1,balanced,0.10964266459147136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,4,1,power_law_1.01,0.06804479956626892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,4,1,power_law_1.01,0.0689087986946106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,4,1,power_law_1.2,0.06637439727783204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,4,1,power_law_1.2,0.06810240149497986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,8,1,balanced,0.07936533292134602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,8,1,balanced,0.08006933331489563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,8,1,power_law_1.01,0.05532159805297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,8,1,power_law_1.01,0.05612800121307373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,8,1,power_law_1.2,0.05255680084228516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,3072,1536,8,256,8,1,power_law_1.2,0.05294079780578613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,1,balanced,0.14144532879193625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,1,balanced,0.1418293317159017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,1,power_law_1.01,0.1528831958770752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,1,power_law_1.01,0.1580672025680542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,1,power_law_1.2,0.15518720149993898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,1,power_law_1.2,0.15730559825897217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,2,balanced,0.08640533685684204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,2,balanced,0.08684800068537395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,2,power_law_1.01,0.09797760248184204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,2,power_law_1.01,0.09882240295410157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,2,power_law_1.2,0.09930239915847779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,2,power_law_1.2,0.10069760084152221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,4,balanced,0.059792002042134605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,4,balanced,0.06172800064086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,4,power_law_1.01,0.06225919723510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,4,power_law_1.01,0.06277120113372803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,4,power_law_1.2,0.06277120113372803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,4,power_law_1.2,0.06428160071372986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,8,balanced,0.047744000951449074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,8,balanced,0.04826133449872335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,8,power_law_1.01,0.04655359983444214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,8,power_law_1.01,0.04687359929084778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,8,power_law_1.2,0.04656639993190766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,1,8,power_law_1.2,0.04793600142002106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,16,1,balanced,0.029578665892283123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,16,1,balanced,0.029893333713213604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,16,1,power_law_1.01,0.029977598786354066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,16,1,power_law_1.01,0.031513598561286923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,16,1,power_law_1.2,0.030003198981285097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,16,1,power_law_1.2,0.030079999566078187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,2,1,balanced,0.08526399731636047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,2,1,balanced,0.08624000350634257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,2,1,power_law_1.01,0.0890175998210907
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,2,1,power_law_1.01,0.09052799940109253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,2,1,power_law_1.2,0.0902400016784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,2,1,power_law_1.2,0.09079679846763611
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,32,1,balanced,0.027402666707833607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,32,1,balanced,0.027503999571005504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,32,1,power_law_1.01,0.026732799410820008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,32,1,power_law_1.01,0.028115200996398925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,32,1,power_law_1.2,0.02680320143699646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,32,1,power_law_1.2,0.028115200996398925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,4,1,balanced,0.05786666770776113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,4,1,balanced,0.05821333328882853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,4,1,power_law_1.01,0.05861759781837463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,4,1,power_law_1.01,0.05932160019874573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,4,1,power_law_1.2,0.05865600109100342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,4,1,power_law_1.2,0.059443199634552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,8,1,balanced,0.03822399924198786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,8,1,balanced,0.03830400109291077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,8,1,power_law_1.01,0.04154880046844482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,8,1,power_law_1.01,0.04226559996604919
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,8,1,power_law_1.2,0.04222719967365265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,14336,2,8,8,1,power_law_1.2,0.04314880073070526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,1,balanced,0.22034132480621338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,1,balanced,0.22034666935602823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,1,power_law_1.01,0.1821887969970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,1,power_law_1.01,0.18698240518569947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,1,power_law_1.2,0.18462079763412476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,1,power_law_1.2,0.1853503942489624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,128,balanced,0.037605332831541695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,128,balanced,0.03774933268626531
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,128,power_law_1.01,0.0358271986246109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,128,power_law_1.01,0.03585920035839081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,128,power_law_1.2,0.03498240113258362
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,128,power_law_1.2,0.0355648010969162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,16,balanced,0.03457066665093104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,16,balanced,0.035317334036032356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,16,power_law_1.01,0.03524479866027832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,16,power_law_1.01,0.03560959994792938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,16,power_law_1.2,0.03534719944000244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,16,power_law_1.2,0.035436800122261046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,2,balanced,0.12575999895731607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,2,balanced,0.12684266765912375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,2,power_law_1.01,0.11170560121536255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,2,power_law_1.01,0.11180800199508667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,2,power_law_1.2,0.11166080236434936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,2,power_law_1.2,0.11306240558624267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,32,balanced,0.033370666205883026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,32,balanced,0.03346133232116699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,32,power_law_1.01,0.030483201146125793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,32,power_law_1.01,0.030752000212669373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,32,power_law_1.2,0.030099201202392577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,32,power_law_1.2,0.03043839931488037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,4,balanced,0.08024533092975616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,4,balanced,0.08065600196520488
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,4,power_law_1.01,0.07092480063438415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,4,power_law_1.01,0.07331839799880982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,4,power_law_1.2,0.07034239768981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,4,power_law_1.2,0.07084159851074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,64,balanced,0.031317333380381264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,64,balanced,0.03344533344109853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,64,power_law_1.01,0.03000960052013397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,64,power_law_1.01,0.0313728004693985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,64,power_law_1.2,0.030028799176216127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,64,power_law_1.2,0.03121280074119568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,8,balanced,0.05574400226275126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,8,balanced,0.05808533231417338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,8,power_law_1.01,0.05070080161094666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,8,power_law_1.01,0.05144960284233093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,8,power_law_1.2,0.051692801713943484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,1,8,power_law_1.2,0.052908802032470705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,2,1,balanced,0.1281706690788269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,2,1,balanced,0.13013333082199097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,2,1,power_law_1.01,0.10882560014724732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,2,1,power_law_1.01,0.11292159557342529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,2,1,power_law_1.2,0.1098688006401062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,2,1,power_law_1.2,0.11106560230255128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,4,1,balanced,0.0823520024617513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,4,1,balanced,0.08378133177757263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,4,1,power_law_1.01,0.0726144015789032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,4,1,power_law_1.01,0.07269759774208069
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,4,1,power_law_1.2,0.07112320065498352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,4,1,power_law_1.2,0.07299839854240417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,8,1,balanced,0.062319998939832054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,8,1,balanced,0.06400533517201741
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,8,1,power_law_1.01,0.05742719769477844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,8,1,power_law_1.01,0.05751039981842041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,8,1,power_law_1.2,0.05668479800224304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,4096,1536,8,128,8,1,power_law_1.2,0.057004797458648684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,1,balanced,0.22075200080871582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,1,balanced,0.2214346726735433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,1,power_law_1.01,0.28935680389404295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,1,power_law_1.01,0.290393590927124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,1,power_law_1.2,0.28255999088287354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,1,power_law_1.2,0.291212797164917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,2,balanced,0.12839466333389282
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,2,balanced,0.12922666470209757
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,2,power_law_1.01,0.16951040029525757
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,2,power_law_1.01,0.17087359428405763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,2,power_law_1.2,0.1657920002937317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,2,power_law_1.2,0.18024959564208984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,4,balanced,0.07911466558774312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,4,balanced,0.08032533526420593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,4,power_law_1.01,0.091839998960495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,4,power_law_1.01,0.09493119716644287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,4,power_law_1.2,0.08700159788131714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,4,power_law_1.2,0.0878271996974945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,8,balanced,0.0603413333495458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,8,balanced,0.06232533355553945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,8,power_law_1.01,0.058534401655197146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,8,power_law_1.01,0.05948160290718078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,8,power_law_1.2,0.0590719997882843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,1,8,power_law_1.2,0.06037120223045349
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,16,1,balanced,0.03347733368476232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,16,1,balanced,0.03387733300526937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,16,1,power_law_1.01,0.03768320083618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,16,1,power_law_1.01,0.03815680146217346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,16,1,power_law_1.2,0.038252800703048706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,16,1,power_law_1.2,0.03849599957466125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,2,1,balanced,0.12495999534924825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,2,1,balanced,0.1276479959487915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,2,1,power_law_1.01,0.13408000469207765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,2,1,power_law_1.01,0.13423360586166383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,2,1,power_law_1.2,0.13482240438461304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,2,1,power_law_1.2,0.13485440015792846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,32,1,balanced,0.029215998947620392
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,32,1,balanced,0.03052799900372823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,32,1,power_law_1.01,0.02929919958114624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,32,1,power_law_1.01,0.029491201043128967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,32,1,power_law_1.2,0.029068800806999206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,32,1,power_law_1.2,0.029183998703956604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,4,1,balanced,0.07854400078455608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,4,1,balanced,0.07931200166543324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,4,1,power_law_1.01,0.08116480112075805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,4,1,power_law_1.01,0.08436480164527893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,4,1,power_law_1.2,0.08115839958190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,4,1,power_law_1.2,0.08229759931564332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,8,1,balanced,0.05398933092753092
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,8,1,balanced,0.05435733497142792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,8,1,power_law_1.01,0.0541055977344513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,8,1,power_law_1.01,0.054655998945236206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,8,1,power_law_1.2,0.05378559827804565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,16384,2,8,8,1,power_law_1.2,0.05503360033035278
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,1,balanced,0.7660160064697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,1,balanced,0.7682720025380453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,1,power_law_1.01,0.39883520603179934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,1,power_law_1.01,0.4010303974151611
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,1,power_law_1.2,0.3636543989181519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,1,power_law_1.2,0.36615040302276614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,128,balanced,0.035631999373435974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,128,balanced,0.03572800010442734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,128,power_law_1.01,0.03375999927520752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,128,power_law_1.01,0.034944000840187076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,128,power_law_1.2,0.03333120048046112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,128,power_law_1.2,0.034560000896453856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,16,balanced,0.0790719985961914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,16,balanced,0.08071466783682506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,16,power_law_1.01,0.07063680291175842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,16,power_law_1.01,0.07144320011138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,16,power_law_1.2,0.06926079988479614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,16,power_law_1.2,0.06977279782295227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,2,balanced,0.399946649869283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,2,balanced,0.4019306500752767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,2,power_law_1.01,0.21996800899505614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,2,power_law_1.01,0.23575680255889891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,2,power_law_1.2,0.22929279804229735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,2,power_law_1.2,0.2415616035461426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,256,balanced,0.039813332259655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,256,balanced,0.04116799930731455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,256,power_law_1.01,0.03964160084724426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,256,power_law_1.01,0.03994880020618439
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,256,power_law_1.2,0.038950398564338684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,256,power_law_1.2,0.03911679983139038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,32,balanced,0.05409066875775655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,32,balanced,0.05653333167235056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,32,power_law_1.01,0.04644480049610138
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,32,power_law_1.01,0.05275520086288452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,32,power_law_1.2,0.04567039906978607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,32,power_law_1.2,0.04855040013790131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,4,balanced,0.21753066778182983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,4,balanced,0.2185653249422709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,4,power_law_1.01,0.14220160245895386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,4,power_law_1.01,0.14824960231781006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,4,power_law_1.2,0.13686399459838866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,4,power_law_1.2,0.16583679914474486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,64,balanced,0.03675200045108795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,64,balanced,0.038015998899936676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,64,power_law_1.01,0.03504000008106232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,64,power_law_1.01,0.03518719971179962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,64,power_law_1.2,0.03524479866027832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,64,power_law_1.2,0.035718399286270144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,8,balanced,0.1262399951616923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,8,balanced,0.12702932953834534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,8,power_law_1.01,0.09772800207138062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,8,power_law_1.01,0.11436159610748291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,8,power_law_1.2,0.09330559968948364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,1,8,power_law_1.2,0.10209920406341552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,16,1,balanced,0.10355732838312785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,16,1,balanced,0.10511466860771179
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,16,1,power_law_1.01,0.06871039867401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,16,1,power_law_1.01,0.06993280053138733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,16,1,power_law_1.2,0.06663680076599121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,16,1,power_law_1.2,0.06689919829368592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,2,1,balanced,0.40143465995788574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,2,1,balanced,0.4021173318227132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,2,1,power_law_1.01,0.21833600997924804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,2,1,power_law_1.01,0.220633602142334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,2,1,power_law_1.2,0.19690239429473877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,2,1,power_law_1.2,0.2020672082901001
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,32,1,balanced,0.08680533369382222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,32,1,balanced,0.08859200278917949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,32,1,power_law_1.01,0.05763840079307556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,32,1,power_law_1.01,0.058911997079849246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,32,1,power_law_1.2,0.055353599786758426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,32,1,power_law_1.2,0.05586559772491455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,4,1,balanced,0.22167466084162393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,4,1,balanced,0.22168533007303873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,4,1,power_law_1.01,0.13006080389022828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,4,1,power_law_1.01,0.1315775990486145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,4,1,power_law_1.2,0.12001279592514039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,4,1,power_law_1.2,0.12170239686965942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,8,1,balanced,0.13741866747538248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,8,1,balanced,0.13768532872200012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,8,1,power_law_1.01,0.08737919926643371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,8,1,power_law_1.01,0.08874880075454712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,8,1,power_law_1.2,0.08353279829025269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2048,8,256,8,1,power_law_1.2,0.0839680016040802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,1,balanced,0.6076373259226481
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,1,balanced,0.6092426776885986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,1,power_law_1.01,0.465715217590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,1,power_law_1.01,0.4841792106628418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,1,power_law_1.2,0.46606078147888186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,1,power_law_1.2,0.4710207939147949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,16,balanced,0.06842133402824402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,16,balanced,0.06902933120727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,16,power_law_1.01,0.06500480175018311
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,16,power_law_1.01,0.06517120003700257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,16,power_law_1.2,0.06305919885635376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,16,power_law_1.2,0.06577919721603394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,2,balanced,0.3216373324394226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,2,balanced,0.32310400406519574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,2,power_law_1.01,0.26721920967102053
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,2,power_law_1.01,0.2677056074142456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,2,power_law_1.2,0.2573632001876831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,2,power_law_1.2,0.27210240364074706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,32,balanced,0.053717335065205894
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,32,balanced,0.054042667150497437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,32,power_law_1.01,0.050483202934265135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,32,power_law_1.01,0.05069440007209778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,32,power_law_1.2,0.05009920001029968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,32,power_law_1.2,0.0516543984413147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,4,balanced,0.17781333128611246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,4,balanced,0.1782346765200297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,4,power_law_1.01,0.15148160457611085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,4,power_law_1.01,0.15568000078201294
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,4,power_law_1.2,0.15130879878997802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,4,power_law_1.2,0.15712000131607057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,8,balanced,0.10599467158317566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,8,balanced,0.10619200269381206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,8,power_law_1.01,0.09205120205879211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,8,power_law_1.01,0.10019840002059936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,8,power_law_1.2,0.09566079974174499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,1,8,power_law_1.2,0.09721599817276001
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,2,1,balanced,0.3234666585922241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,2,1,balanced,0.3248853286107381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,2,1,power_law_1.01,0.25509119033813477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,2,1,power_law_1.01,0.25793919563293455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,2,1,power_law_1.2,0.25541119575500487
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,2,1,power_law_1.2,0.2581952095031738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,4,1,balanced,0.18762133518854776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,4,1,balanced,0.18827199935913086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,4,1,power_law_1.01,0.15168639421463012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,4,1,power_law_1.01,0.1517184019088745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,4,1,power_law_1.2,0.15193599462509155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,4,1,power_law_1.2,0.15407999753952026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,8,1,balanced,0.11218667030334473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,8,1,balanced,0.11274133125940959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,8,1,power_law_1.01,0.0948032021522522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,8,1,power_law_1.01,0.0953279972076416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,8,1,power_law_1.2,0.09324799776077271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,6144,2560,8,160,8,1,power_law_1.2,0.09463040232658386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,1,balanced,0.8904106616973877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,1,balanced,0.8905759652455648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,1,power_law_1.01,0.4738944053649902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,1,power_law_1.01,0.4813055992126465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,1,power_law_1.2,0.42113280296325684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,1,power_law_1.2,0.44204158782958985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,128,balanced,0.03762666632731756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,128,balanced,0.0377866675456365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,128,power_law_1.01,0.0350847989320755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,128,power_law_1.01,0.035622400045394895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,128,power_law_1.2,0.035257598757743834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,128,power_law_1.2,0.03633280098438263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,16,balanced,0.0865066647529602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,16,balanced,0.08709866801897685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,16,power_law_1.01,0.06899840235710145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,16,power_law_1.01,0.07006080150604248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,16,power_law_1.2,0.06548479795455933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,16,power_law_1.2,0.07538560032844543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,2,balanced,0.4629280169804891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,2,balanced,0.4636586507161458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,2,power_law_1.01,0.25797760486602783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,2,power_law_1.01,0.2763776063919067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,2,power_law_1.2,0.25207679271697997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,2,power_law_1.2,0.2781055927276611
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,256,balanced,0.04380266865094503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,256,balanced,0.04387733340263367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,256,power_law_1.01,0.041510400176048276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,256,power_law_1.01,0.04167680144309997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,256,power_law_1.2,0.04020479917526245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,256,power_law_1.2,0.04190079867839813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,32,balanced,0.05845333139101664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,32,balanced,0.06019733349482218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,32,power_law_1.01,0.053324800729751584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,32,power_law_1.01,0.056883198022842404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,32,power_law_1.2,0.050732797384262084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,32,power_law_1.2,0.051475197076797485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,4,balanced,0.24781332413355509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,4,balanced,0.24809600909550986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,4,power_law_1.01,0.17938560247421265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,4,power_law_1.01,0.18627840280532837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,4,power_law_1.2,0.14775680303573607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,4,power_law_1.2,0.17432960271835327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,64,balanced,0.044154668847719826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,64,balanced,0.04586133360862732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,64,power_law_1.01,0.03713279962539673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,64,power_law_1.01,0.03909760117530823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,64,power_law_1.2,0.039078399538993835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,64,power_law_1.2,0.040729600191116336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,8,balanced,0.1414186656475067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,8,balanced,0.14194666345914206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,8,power_law_1.01,0.10373760461807251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,8,power_law_1.01,0.11310720443725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,8,power_law_1.2,0.11634559631347656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,1,8,power_law_1.2,0.11959680318832397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,16,1,balanced,0.11538666486740112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,16,1,balanced,0.11673067013422649
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,16,1,power_law_1.01,0.07703040242195129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,16,1,power_law_1.01,0.07744640111923218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,16,1,power_law_1.2,0.07288320064544677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,16,1,power_law_1.2,0.07459200024604798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,2,1,balanced,0.46369067827860516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,2,1,balanced,0.4643839995066325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,2,1,power_law_1.01,0.2479680061340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,2,1,power_law_1.01,0.2589119911193848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,2,1,power_law_1.2,0.2321023941040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,2,1,power_law_1.2,0.23331201076507568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,32,1,balanced,0.09702400366465251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,32,1,balanced,0.09705600142478943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,32,1,power_law_1.01,0.0657151997089386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,32,1,power_law_1.01,0.06607360243797303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,32,1,power_law_1.2,0.06307200193405152
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,32,1,power_law_1.2,0.06340479850769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,4,1,balanced,0.2516213258107503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,4,1,balanced,0.25244800249735516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,4,1,power_law_1.01,0.14670720100402831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,4,1,power_law_1.01,0.1486143946647644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,4,1,power_law_1.2,0.1355072021484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,4,1,power_law_1.2,0.13640320301055908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,8,1,balanced,0.1541866660118103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,8,1,balanced,0.15614400307337442
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,8,1,power_law_1.01,0.09670400023460388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,8,1,power_law_1.01,0.09749760031700135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,8,1,power_law_1.2,0.09035519957542419
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,256,8,1,power_law_1.2,0.09340159893035889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,1,balanced,0.8908586502075195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,1,balanced,0.8925706545511881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,1,power_law_1.01,0.5925183773040772
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,1,power_law_1.01,0.5937856197357178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,1,power_law_1.2,0.5226175785064697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,1,power_law_1.2,0.5300096035003662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,128,balanced,0.03737599899371465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,128,balanced,0.0377813329299291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,128,power_law_1.01,0.03792639970779419
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,128,power_law_1.01,0.03802880048751831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,128,power_law_1.2,0.037273600697517395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,128,power_law_1.2,0.03829120099544525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,16,balanced,0.08753599723180135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,16,balanced,0.08854400118192036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,16,power_law_1.01,0.1122048020362854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,16,power_law_1.01,0.11221120357513428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,16,power_law_1.2,0.10460159778594971
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,16,power_law_1.2,0.10620160102844238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,2,balanced,0.46164798736572266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,2,balanced,0.463648001352946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,2,power_law_1.01,0.33632640838623046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,2,power_law_1.01,0.3392064094543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,2,power_law_1.2,0.3131648063659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,2,power_law_1.2,0.32576000690460205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,32,balanced,0.060165335734685264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,32,balanced,0.061280002196629844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,32,power_law_1.01,0.06883199810981751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,32,power_law_1.01,0.06972159743309021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,32,power_law_1.2,0.06114559769630432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,32,power_law_1.2,0.06270719766616821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,4,balanced,0.24686932563781738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,4,balanced,0.24837867418924967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,4,power_law_1.01,0.22456319332122804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,4,power_law_1.01,0.23123199939727784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,4,power_law_1.2,0.21465599536895752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,4,power_law_1.2,0.2192768096923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,64,balanced,0.044863998889923096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,64,balanced,0.04589866598447164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,64,power_law_1.01,0.051692801713943484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,64,power_law_1.01,0.054630398750305176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,64,power_law_1.2,0.047219198942184445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,64,power_law_1.2,0.047244799137115476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,8,balanced,0.14125333229700723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,8,balanced,0.14194132884343466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,8,power_law_1.01,0.17604479789733887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,8,power_law_1.01,0.1834239959716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,8,power_law_1.2,0.1804159998893738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,1,8,power_law_1.2,0.18718719482421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,16,1,balanced,0.1156160036722819
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,16,1,balanced,0.11744532982508342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,16,1,power_law_1.01,0.08917760252952575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,16,1,power_law_1.01,0.08979840278625488
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,16,1,power_law_1.2,0.0816703975200653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,16,1,power_law_1.2,0.08328959941864014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,2,1,balanced,0.46455466747283936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,2,1,balanced,0.4649493296941121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,2,1,power_law_1.01,0.3092992067337036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,2,1,power_law_1.01,0.31741440296173096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,2,1,power_law_1.2,0.28266239166259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,2,1,power_law_1.2,0.28695039749145507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,32,1,balanced,0.09697600205739339
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,32,1,balanced,0.09755733609199524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,32,1,power_law_1.01,0.07616000175476074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,32,1,power_law_1.01,0.0785535991191864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,32,1,power_law_1.2,0.07007359862327575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,32,1,power_law_1.2,0.07085440158843995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,4,1,balanced,0.25255467494328815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,4,1,balanced,0.25296000639597577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,4,1,power_law_1.01,0.17328640222549438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,4,1,power_law_1.01,0.17388800382614136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,4,1,power_law_1.2,0.15946240425109864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,8,1,balanced,0.15451733271280924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,8,1,balanced,0.15461867054303488
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,8,1,power_law_1.01,0.11205120086669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,8,1,power_law_1.01,0.11455359458923339
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,8,1,power_law_1.2,0.10586240291595458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,32,7168,2048,8,384,8,1,power_law_1.2,0.10649600028991699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,1,balanced,0.09939199686050415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,1,balanced,0.10071466366449992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,1,power_law_1.01,0.09477120041847228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,1,power_law_1.01,0.0950976014137268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,1,power_law_1.2,0.0961471974849701
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,1,power_law_1.2,0.09713280200958252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,128,balanced,0.03745600084463755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,128,balanced,0.03746666759252548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,128,power_law_1.01,0.035692799091339114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,128,power_law_1.01,0.0359360009431839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,128,power_law_1.2,0.035724800825119016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,128,power_law_1.2,0.03590399920940399
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,16,balanced,0.03952533255020777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,16,balanced,0.03965333352486292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,16,power_law_1.01,0.038252800703048706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,16,power_law_1.01,0.03840000033378601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,16,power_law_1.2,0.03863680064678192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,16,power_law_1.2,0.03871999979019165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,2,balanced,0.06225066880385081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,2,balanced,0.062261333068211876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,2,power_law_1.01,0.06197119951248169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,2,power_law_1.01,0.06321280002593994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,2,power_law_1.2,0.06440960168838501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,2,power_law_1.2,0.06512640118598938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,32,balanced,0.03942933430274328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,32,balanced,0.03949866692225138
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,32,power_law_1.01,0.03694719970226288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,32,power_law_1.01,0.03696640133857727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,32,power_law_1.2,0.036396801471710205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,32,power_law_1.2,0.03696640133857727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,4,balanced,0.053413331508636475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,4,balanced,0.054757331808408104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,4,power_law_1.01,0.04836480021476745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,4,power_law_1.01,0.04839679896831513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,4,power_law_1.2,0.048563200235366824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,4,power_law_1.2,0.05059199929237366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,64,balanced,0.03750933210055033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,64,balanced,0.03766400118668874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,64,power_law_1.01,0.036134400963783266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,64,power_law_1.01,0.03625600039958954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,64,power_law_1.2,0.03632639944553375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,64,power_law_1.2,0.03701759874820709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,8,balanced,0.06213866670926412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,8,balanced,0.06850666801134746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,8,power_law_1.01,0.055193597078323366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,8,power_law_1.01,0.05559679865837097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,8,power_law_1.2,0.049747198820114136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,1,8,power_law_1.2,0.05539199709892273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,2,1,balanced,0.07056533296902974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,2,1,balanced,0.07238933444023132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,2,1,power_law_1.01,0.066975998878479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,2,1,power_law_1.01,0.06706560254096985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,2,1,power_law_1.2,0.06712960004806519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,2,1,power_law_1.2,0.06878079771995545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,4,1,balanced,0.0582239975531896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,4,1,balanced,0.06002666552861532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,4,1,power_law_1.01,0.05466880202293396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,4,1,power_law_1.01,0.05589119791984558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,4,1,power_law_1.2,0.05581439733505249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,2048,768,8,128,4,1,power_law_1.2,0.05617920160293579
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,1,balanced,0.35469333330790204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,1,balanced,0.3590346574783325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,1,power_law_1.01,0.3241791963577271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,1,power_law_1.01,0.3266304016113281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,1,power_law_1.2,0.3387648105621338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,1,power_law_1.2,0.3469311952590942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,128,balanced,0.04147200038035711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,128,balanced,0.041562666495641075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,128,power_law_1.01,0.039027199149131775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,128,power_law_1.01,0.03940480053424835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,128,power_law_1.2,0.03883520066738129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,128,power_law_1.2,0.03958399891853333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,16,balanced,0.13766400019327799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,16,balanced,0.1418293317159017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,16,power_law_1.01,0.11716480255126953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,16,power_law_1.01,0.1192255973815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,16,power_law_1.2,0.10177279710769653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,16,power_law_1.2,0.11249920129776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,2,balanced,0.18084800243377686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,2,balanced,0.1811306675275167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,2,power_law_1.01,0.16319359540939332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,2,power_law_1.01,0.16544640064239502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,2,power_law_1.2,0.1701311945915222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,2,power_law_1.2,0.17613439559936522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,256,balanced,0.04044266790151596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,256,balanced,0.04055999964475632
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,256,power_law_1.01,0.03858560025691986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,256,power_law_1.01,0.03880319893360138
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,256,power_law_1.2,0.03814400136470795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,256,power_law_1.2,0.03857280015945434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,32,balanced,0.060032000144322716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,32,balanced,0.06286933521429698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,32,power_law_1.01,0.05555840134620667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,32,power_law_1.01,0.05870720148086548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,32,power_law_1.2,0.05199360251426697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,32,power_law_1.2,0.05384960174560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,4,balanced,0.1097920040289561
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,4,balanced,0.11084799965222676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,4,power_law_1.01,0.10029439926147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,4,power_law_1.01,0.10106879472732544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,4,power_law_1.2,0.10329600572586059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,4,power_law_1.2,0.10336639881134033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,64,balanced,0.04378133515516917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,64,balanced,0.04409599800904592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,64,power_law_1.01,0.041631999611854556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,64,power_law_1.01,0.042028799653053284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,64,power_law_1.2,0.04131839871406555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,64,power_law_1.2,0.04185599982738495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,8,balanced,0.10242666800816853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,8,balanced,0.10364266236623128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,8,power_law_1.01,0.07885439991950989
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,8,power_law_1.01,0.08145279884338379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,8,power_law_1.2,0.08278399705886841
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,1,8,power_law_1.2,0.0876800000667572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,2,1,balanced,0.2187946637471517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,2,1,balanced,0.21967466672261557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,2,1,power_law_1.01,0.19324159622192383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,2,1,power_law_1.01,0.19629440307617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,2,1,power_law_1.2,0.19988479614257812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,4,1,balanced,0.13878933588663736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,4,1,balanced,0.13969066739082336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,4,1,power_law_1.01,0.12371200323104858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,4,1,power_law_1.01,0.12432639598846436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,4,1,power_law_1.2,0.1260480046272278
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,4,1,power_law_1.2,0.12670079469680787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,8,1,balanced,0.10800533493359883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,8,1,balanced,0.10834133625030518
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,8,1,power_law_1.01,0.09710080027580262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,8,1,power_law_1.01,0.09815679788589478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,8,1,power_law_1.2,0.09813119769096375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,3072,1536,8,256,8,1,power_law_1.2,0.09966080188751221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,1,balanced,0.3670719861984253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,1,balanced,0.3680906693140666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,1,power_law_1.01,0.22332799434661865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,1,power_law_1.01,0.22627840042114258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,1,power_law_1.2,0.2246527910232544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,1,power_law_1.2,0.22815361022949218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,2,balanced,0.25895466407140094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,2,balanced,0.26606933275858563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,2,power_law_1.01,0.15580159425735474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,2,power_law_1.01,0.161407995223999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,2,power_law_1.2,0.1623296022415161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,2,power_law_1.2,0.2684992074966431
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,4,balanced,0.15148267149925232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,4,balanced,0.15898666779200235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,4,power_law_1.01,0.11827839612960815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,4,power_law_1.01,0.1455615997314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,4,power_law_1.2,0.11932799816131592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,4,power_law_1.2,0.14663039445877074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,8,balanced,0.10965866843859355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,8,balanced,0.11049600442250569
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,8,power_law_1.01,0.1118783950805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,8,power_law_1.01,0.11320320367813111
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,8,power_law_1.2,0.114028799533844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,1,8,power_law_1.2,0.11526399850845337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,16,1,balanced,0.0528053343296051
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,16,1,balanced,0.053120002150535583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,16,1,power_law_1.01,0.043910399079322815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,16,1,power_law_1.01,0.044064000248909
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,16,1,power_law_1.2,0.0430976003408432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,16,1,power_law_1.2,0.04338560104370117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,2,1,balanced,0.18690667549769083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,2,1,balanced,0.19886932770411173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,2,1,power_law_1.01,0.12695679664611817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,2,1,power_law_1.01,0.1270848035812378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,2,1,power_law_1.2,0.12620160579681397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,2,1,power_law_1.2,0.12728960514068605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,32,1,balanced,0.04381866753101349
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,32,1,balanced,0.04558399816354116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,32,1,power_law_1.01,0.038201600313186646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,32,1,power_law_1.01,0.03904640078544617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,32,1,power_law_1.2,0.03824000060558319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,32,1,power_law_1.2,0.03870719969272614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,4,1,balanced,0.11159466703732808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,4,1,balanced,0.11885333061218262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,4,1,power_law_1.01,0.08050559759140015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,4,1,power_law_1.01,0.08222079873085023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,4,1,power_law_1.2,0.08015360236167908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,4,1,power_law_1.2,0.08353919982910156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,8,1,balanced,0.08086933195590973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,8,1,balanced,0.08163199822107951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,8,1,power_law_1.01,0.05958399772644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,8,1,power_law_1.01,0.05975040197372437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,8,1,power_law_1.2,0.05991680026054382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,14336,2,8,8,1,power_law_1.2,0.06032000184059143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,1,balanced,0.26600533723831177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,1,balanced,0.266975998878479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,1,power_law_1.01,0.26017920970916747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,1,power_law_1.01,0.26225919723510743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,1,power_law_1.2,0.26927359104156495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,1,power_law_1.2,0.27162880897521974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,128,balanced,0.043322667479515076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,128,balanced,0.04376000165939331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,128,power_law_1.01,0.04220159947872162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,128,power_law_1.01,0.042208001017570496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,128,power_law_1.2,0.042182400822639465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,128,power_law_1.2,0.042931199073791504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,16,balanced,0.06473066906134288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,16,balanced,0.06621866424878438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,16,power_law_1.01,0.060710400342941284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,16,power_law_1.01,0.06576640009880066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,16,power_law_1.2,0.0623744010925293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,16,power_law_1.2,0.06903039813041686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,2,balanced,0.1402613321940104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,2,balanced,0.14141333103179932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,2,power_law_1.01,0.14139519929885863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,2,power_law_1.01,0.14663039445877074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,2,power_law_1.2,0.14527360200881959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,2,power_law_1.2,0.1497599959373474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,32,balanced,0.04809066653251648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,32,balanced,0.049039999643961586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,32,power_law_1.01,0.04550400078296661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,32,power_law_1.01,0.04650880098342895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,32,power_law_1.2,0.04472959935665131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,32,power_law_1.2,0.046188798546791074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,4,balanced,0.11154133081436157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,4,balanced,0.11752000451087952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,4,power_law_1.01,0.09587839841842652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,4,power_law_1.01,0.10191999673843384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,4,power_law_1.2,0.09407359957695008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,4,power_law_1.2,0.09573760032653808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,64,balanced,0.04502933224042257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,64,balanced,0.045850664377212524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,64,power_law_1.01,0.042508798837661746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,64,power_law_1.01,0.04296959936618805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,64,power_law_1.2,0.04348799884319306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,64,power_law_1.2,0.04371840059757233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,8,balanced,0.17283733685811362
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,8,balanced,0.1746506690979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,8,power_law_1.01,0.12965760231018067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,8,power_law_1.01,0.13775999546051027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,8,power_law_1.2,0.12079360485076904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,1,8,power_law_1.2,0.13701119422912597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,2,1,balanced,0.16967999935150146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,2,1,balanced,0.17139732837677002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,2,1,power_law_1.01,0.160806405544281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,2,1,power_law_1.01,0.16225279569625856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,2,1,power_law_1.2,0.16354559659957885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,2,1,power_law_1.2,0.16449919939041138
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,4,1,balanced,0.11519466837247212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,4,1,balanced,0.11547733346621196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,4,1,power_law_1.01,0.10601600408554077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,4,1,power_law_1.01,0.10695680379867553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,4,1,power_law_1.2,0.10613759756088256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,4,1,power_law_1.2,0.10854400396347046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,8,1,balanced,0.09062400460243225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,8,1,balanced,0.09222400188446045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,8,1,power_law_1.01,0.08386560082435608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,8,1,power_law_1.01,0.08417919874191285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,8,1,power_law_1.2,0.08382080197334289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,4096,1536,8,128,8,1,power_law_1.2,0.08442879915237426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,1,balanced,0.531823992729187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,1,balanced,0.5329386790593466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,1,power_law_1.01,0.37010560035705564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,1,power_law_1.01,0.40381441116333006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,1,power_law_1.2,0.38996479511260984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,1,power_law_1.2,0.39530239105224607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,2,balanced,0.3332693378130595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,2,balanced,0.33638401826222736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,2,power_law_1.01,0.19953919649124147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,2,power_law_1.01,0.22163839340209962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,2,power_law_1.2,0.2032831907272339
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,2,power_law_1.2,0.2986176013946533
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,4,balanced,0.19037866592407227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,4,balanced,0.19166932503382364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,4,power_law_1.01,0.16587519645690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,4,power_law_1.01,0.20459520816802979
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,4,power_law_1.2,0.1387712001800537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,4,power_law_1.2,0.15618560314178467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,8,balanced,0.12603200475374857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,8,balanced,0.12960533301035562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,8,power_law_1.01,0.1440127968788147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,8,power_law_1.01,0.14419840574264525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,8,power_law_1.2,0.1416767954826355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,1,8,power_law_1.2,0.14484479427337646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,16,1,balanced,0.06970666845639546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,16,1,balanced,0.07002666592597961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,16,1,power_law_1.01,0.058233600854873654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,16,1,power_law_1.01,0.058361601829528806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,16,1,power_law_1.2,0.05914239883422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,16,1,power_law_1.2,0.05989120006561279
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,2,1,balanced,0.26179732879002887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,2,1,balanced,0.26254934072494507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,2,1,power_law_1.01,0.18829439878463744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,2,1,power_law_1.01,0.19032959938049315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,2,1,power_law_1.2,0.18466559648513795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,2,1,power_law_1.2,0.1894144058227539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,32,1,balanced,0.04986133178075155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,32,1,balanced,0.050714666644732155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,32,1,power_law_1.01,0.04248960018157959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,32,1,power_law_1.01,0.04353919923305512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,32,1,power_law_1.2,0.04338560104370117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,32,1,power_law_1.2,0.04376319944858551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,4,1,balanced,0.15190399686495462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,4,1,balanced,0.1521013379096985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,4,1,power_law_1.01,0.11208319664001465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,4,1,power_law_1.01,0.11384320259094238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,4,1,power_law_1.2,0.1131327986717224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,4,1,power_law_1.2,0.11549439430236816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,8,1,balanced,0.09743466973304749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,8,1,balanced,0.099589337905248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,8,1,power_law_1.01,0.07697920203208923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,8,1,power_law_1.01,0.07868160009384155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,8,1,power_law_1.2,0.0762112021446228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,16384,2,8,8,1,power_law_1.2,0.07948799729347229
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,1,balanced,0.8910773595174154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,1,balanced,0.8955252965291342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,1,power_law_1.01,0.8208448410034179
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,1,power_law_1.01,0.830303955078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,1,power_law_1.2,0.8509440422058105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,1,power_law_1.2,0.8655872344970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,128,balanced,0.05409066875775655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,128,balanced,0.054154664278030396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,128,power_law_1.01,0.04993920028209686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,128,power_law_1.01,0.05066239833831787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,128,power_law_1.2,0.048895999789237976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,128,power_law_1.2,0.050329601764678954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,16,balanced,0.27592533826828003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,16,balanced,0.28082666794459027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,16,power_law_1.01,0.2106623888015747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,16,power_law_1.01,0.2136320114135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,16,power_law_1.2,0.20127999782562256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,16,power_law_1.2,0.2285248041152954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,2,balanced,0.42289066314697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,2,balanced,0.42393068472544354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,2,power_law_1.01,0.3876415967941284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,2,power_law_1.01,0.40458879470825193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,2,power_law_1.2,0.40286078453063967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,2,power_law_1.2,0.41561598777770997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,256,balanced,0.049285332361857094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,256,balanced,0.04994133114814758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,256,power_law_1.01,0.04748800098896026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,256,power_law_1.01,0.047814399003982544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,256,power_law_1.2,0.047244799137115476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,256,power_law_1.2,0.047295999526977536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,32,balanced,0.12550399700800577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,32,balanced,0.12550933162371317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,32,power_law_1.01,0.09808639883995056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,32,power_law_1.01,0.10895359516143799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,32,power_law_1.2,0.09190400242805481
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,32,power_law_1.2,0.10605440139770508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,4,balanced,0.23506667216618857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,4,balanced,0.23690134286880493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,4,power_law_1.01,0.21217920780181884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,4,power_law_1.01,0.21502718925476075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,4,power_law_1.2,0.2223871946334839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,4,power_law_1.2,0.2244096040725708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,64,balanced,0.06809600194295247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,64,balanced,0.06876799960931142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,64,power_law_1.01,0.06419199705123901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,64,power_law_1.01,0.06479359865188598
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,64,power_law_1.2,0.062105602025985716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,64,power_law_1.2,0.06291199922561645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,8,balanced,0.18968000014623007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,8,balanced,0.1934453248977661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,8,power_law_1.01,0.14353920221328736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,8,power_law_1.01,0.14721920490264892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,8,power_law_1.2,0.15092480182647705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,1,8,power_law_1.2,0.15095679759979247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,16,1,balanced,0.1581546664237976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,16,1,balanced,0.15851733088493347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,16,1,power_law_1.01,0.14464000463485718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,16,1,power_law_1.01,0.14655359983444213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,16,1,power_law_1.2,0.14710400104522706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,16,1,power_law_1.2,0.1483456015586853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,2,1,balanced,0.4723573525746663
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,2,1,balanced,0.47335998217264813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,2,1,power_law_1.01,0.4302080154418945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,2,1,power_law_1.01,0.4312255859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,2,1,power_law_1.2,0.44211840629577637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,2,1,power_law_1.2,0.44294400215148927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,32,1,balanced,0.14078399538993835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,32,1,balanced,0.14099199573198953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,32,1,power_law_1.01,0.12962559461593628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,32,1,power_law_1.01,0.1303104043006897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,32,1,power_law_1.2,0.13097599744796753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,32,1,power_law_1.2,0.1317952036857605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,4,1,balanced,0.27669332424799603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,4,1,balanced,0.27938665946324664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,4,1,power_law_1.01,0.2482304096221924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,4,1,power_law_1.01,0.25404160022735595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,4,1,power_law_1.2,0.25458559989929197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,4,1,power_law_1.2,0.2559679985046387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,8,1,balanced,0.19367466370264688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,8,1,balanced,0.19431465864181519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,8,1,power_law_1.01,0.17623039484024047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,8,1,power_law_1.01,0.17643519639968872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,8,1,power_law_1.2,0.17905919551849364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2048,8,256,8,1,power_law_1.2,0.17906559705734254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,1,balanced,0.7152640024820963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,1,balanced,0.717087984085083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,1,power_law_1.01,0.8438912391662597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,1,power_law_1.01,0.8558208465576171
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,1,power_law_1.2,0.8740608215332031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,1,power_law_1.2,0.875551986694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,16,balanced,0.17829867204030356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,16,balanced,0.1789919932683309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,16,power_law_1.01,0.15213439464569092
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,16,power_law_1.01,0.15386879444122314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,16,power_law_1.2,0.12978559732437134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,16,power_law_1.2,0.15982719659805297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,2,balanced,0.34270934263865155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,2,balanced,0.34284265836079914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,2,power_law_1.01,0.35812480449676515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,2,power_law_1.01,0.3689215898513794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,2,power_law_1.2,0.38064000606536863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,2,power_law_1.2,0.380729603767395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,32,balanced,0.09495466947555542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,32,balanced,0.0951039989789327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,32,power_law_1.01,0.08217599987983704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,32,power_law_1.01,0.08676480054855347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,32,power_law_1.2,0.08443520069122315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,32,power_law_1.2,0.08557440042495727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,4,balanced,0.19530133406321207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,4,balanced,0.19547200202941895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,4,power_law_1.01,0.19482239484786987
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,4,power_law_1.01,0.19596799612045288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,4,power_law_1.2,0.19680639505386352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,4,power_law_1.2,0.20556159019470216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,8,balanced,0.1399893363316854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,8,balanced,0.14070933063824972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,8,power_law_1.01,0.1288831949234009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,8,power_law_1.01,0.12931840419769286
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,8,power_law_1.2,0.13366400003433226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,1,8,power_law_1.2,0.13436800241470337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,2,1,balanced,0.39654401938120526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,2,1,balanced,0.3988853295644124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,2,1,power_law_1.01,0.4620800018310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,2,1,power_law_1.01,0.4685056209564209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,2,1,power_law_1.2,0.47925119400024413
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,2,1,power_law_1.2,0.4796288013458252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,4,1,balanced,0.2553706765174866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,4,1,balanced,0.25619733333587646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,4,1,power_law_1.01,0.28765439987182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,4,1,power_law_1.01,0.2958208084106445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,4,1,power_law_1.2,0.2925503969192505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,4,1,power_law_1.2,0.2951296091079712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,8,1,balanced,0.15958399573961893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,8,1,balanced,0.15993066628774008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,8,1,power_law_1.01,0.17255040407180786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,8,1,power_law_1.01,0.1737280011177063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,8,1,power_law_1.2,0.17569279670715332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,6144,2560,8,160,8,1,power_law_1.2,0.17679359912872314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,1,balanced,1.0418879985809326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,1,balanced,1.0491092999776204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,1,power_law_1.01,0.955833625793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,1,power_law_1.01,0.9581695556640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,1,power_law_1.2,1.0131839752197265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,1,power_law_1.2,1.0237695693969726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,128,balanced,0.05385600030422211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,128,balanced,0.0540533314148585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,128,power_law_1.01,0.051641601324081424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,128,power_law_1.01,0.052172797918319705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,128,power_law_1.2,0.05237759947776795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,128,power_law_1.2,0.05322880148887634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,16,balanced,0.2823839982350667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,16,balanced,0.29436800877253216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,16,power_law_1.01,0.20039680004119872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,16,power_law_1.01,0.21029119491577147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,16,power_law_1.2,0.17640960216522217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,16,power_law_1.2,0.2121216058731079
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,2,balanced,0.4853866497675578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,2,balanced,0.48605867226918537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,2,power_law_1.01,0.44449920654296876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,2,power_law_1.01,0.4632256031036377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,2,power_law_1.2,0.4636223793029785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,2,power_law_1.2,0.4699456214904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,256,balanced,0.05173333485921224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,256,balanced,0.05211733281612396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,256,power_law_1.01,0.04956159889698029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,256,power_law_1.01,0.049728000164031984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,256,power_law_1.2,0.04997760057449341
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,256,power_law_1.2,0.05012480020523071
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,32,balanced,0.1169653336207072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,32,balanced,0.12059733271598816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,32,power_law_1.01,0.10007679462432861
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,32,power_law_1.01,0.10119680166244507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,32,power_law_1.2,0.08969600200653076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,32,power_law_1.2,0.09341440200805665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,4,balanced,0.2691466609636943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,4,balanced,0.2705333431561788
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,4,power_law_1.01,0.2522495985031128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,4,power_law_1.01,0.2528000116348267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,4,power_law_1.2,0.25692799091339114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,4,power_law_1.2,0.2648767948150635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,64,balanced,0.06860800087451935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,64,balanced,0.0688213308652242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,64,power_law_1.01,0.061875200271606444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,64,power_law_1.01,0.0630400002002716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,64,power_law_1.2,0.062118399143219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,64,power_law_1.2,0.06301440000534057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,8,balanced,0.20860799153645834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,8,balanced,0.209279994169871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,8,power_law_1.01,0.16351360082626343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,8,power_law_1.01,0.16378240585327147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,8,power_law_1.2,0.16995840072631835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,1,8,power_law_1.2,0.1735360026359558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,16,1,balanced,0.17857599258422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,16,1,balanced,0.17921600739161173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,16,1,power_law_1.01,0.164300799369812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,16,1,power_law_1.01,0.16677759885787963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,16,1,power_law_1.2,0.1671872019767761
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,16,1,power_law_1.2,0.1672320008277893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,2,1,balanced,0.5490346749623617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,2,1,balanced,0.5500426689783732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,2,1,power_law_1.01,0.5007232189178467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,2,1,power_law_1.01,0.5013504028320312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,2,1,power_law_1.2,0.5181824207305908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,2,1,power_law_1.2,0.5201727867126464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,32,1,balanced,0.15890666842460632
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,32,1,balanced,0.15896532932917276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,32,1,power_law_1.01,0.14512640237808228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,32,1,power_law_1.01,0.14617600440979003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,32,1,power_law_1.2,0.1489408016204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,32,1,power_law_1.2,0.15077760219573974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,4,1,balanced,0.31730133295059204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,4,1,balanced,0.32316267490386963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,4,1,power_law_1.01,0.2868736028671265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,4,1,power_law_1.01,0.28869760036468506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,4,1,power_law_1.2,0.2936896085739136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,4,1,power_law_1.2,0.2957184076309204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,8,1,balanced,0.22025066614151
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,8,1,balanced,0.22114133834838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,8,1,power_law_1.01,0.20021119117736816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,8,1,power_law_1.01,0.2011199951171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,8,1,power_law_1.2,0.20331521034240724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,256,8,1,power_law_1.2,0.204038405418396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,1,balanced,1.3557920455932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,1,balanced,1.357210636138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,1,power_law_1.01,1.2063103675842286
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,1,power_law_1.01,1.2111295700073241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,1,power_law_1.2,1.2044608116149902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,1,power_law_1.2,1.2056063652038573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,128,balanced,0.05682133138179779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,128,balanced,0.06009600063165029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,128,power_law_1.01,0.057708799839019775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,128,power_law_1.01,0.05788159966468811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,128,power_law_1.2,0.05763840079307556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,128,power_law_1.2,0.05782399773597717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,16,balanced,0.16716800133387247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,16,balanced,0.1673706571261088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,16,power_law_1.01,0.12711039781570435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,16,power_law_1.01,0.13649280071258546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,16,power_law_1.2,0.12862080335617065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,16,power_law_1.2,0.13942400217056275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,2,balanced,0.7012480099995931
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,2,balanced,0.7023946444193522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,2,power_law_1.01,0.6288447856903077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,2,power_law_1.01,0.663372802734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,2,power_law_1.2,0.6392127990722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,2,power_law_1.2,0.6635519981384277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,32,balanced,0.2204586664835612
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,32,balanced,0.22088533639907837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,32,power_law_1.01,0.17768319845199584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,32,power_law_1.01,0.18253439664840698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,32,power_law_1.2,0.16470400094985962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,32,power_law_1.2,0.17212159633636476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,4,balanced,0.37247467041015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,4,balanced,0.3731573422749837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,4,power_law_1.01,0.30977280139923097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,4,power_law_1.01,0.32241919040679934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,4,power_law_1.2,0.3297919988632202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,4,power_law_1.2,0.3435967922210693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,64,balanced,0.08410666386286418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,64,balanced,0.08524800340334575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,64,power_law_1.01,0.07739520072937012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,64,power_law_1.01,0.08081279993057251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,64,power_law_1.2,0.07938560247421264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,64,power_law_1.2,0.08001279830932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,8,balanced,0.21449067195256552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,8,balanced,0.2146880030632019
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,8,power_law_1.01,0.18521599769592284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,8,power_law_1.01,0.19073280096054077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,8,power_law_1.2,0.18516479730606078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,1,8,power_law_1.2,0.20273919105529786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,16,1,balanced,0.18145600954691568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,16,1,balanced,0.1829973260561625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,16,1,power_law_1.01,0.18825600147247315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,16,1,power_law_1.01,0.18893439769744874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,16,1,power_law_1.2,0.1885823965072632
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,16,1,power_law_1.2,0.1888383984565735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,2,1,balanced,0.7100266615549723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,2,1,balanced,0.7102719942728678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,2,1,power_law_1.01,0.6261248111724853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,2,1,power_law_1.01,0.6291135787963867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,2,1,power_law_1.2,0.6189375877380371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,2,1,power_law_1.2,0.6365119934082031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,32,1,balanced,0.15397866566975912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,32,1,balanced,0.1542080044746399
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,32,1,power_law_1.01,0.16455680131912231
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,32,1,power_law_1.01,0.16498559713363647
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,32,1,power_law_1.2,0.16431360244750975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,32,1,power_law_1.2,0.16556799411773682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,4,1,balanced,0.39052800337473553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,4,1,balanced,0.3906720081965129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,4,1,power_law_1.01,0.35345280170440674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,4,1,power_law_1.01,0.35369598865509033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,4,1,power_law_1.2,0.3567744016647339
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,4,1,power_law_1.2,0.35829761028289797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,8,1,balanced,0.24081067244211832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,8,1,balanced,0.24182933568954468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,8,1,power_law_1.01,0.2334656000137329
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,8,1,power_law_1.01,0.23745920658111572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,8,1,power_law_1.2,0.23743999004364014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,320,7168,2048,8,384,8,1,power_law_1.2,0.24094080924987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,1,balanced,0.09866666793823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,1,balanced,0.09900800387064616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,1,power_law_1.01,0.09995520114898682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,1,power_law_1.01,0.1007423996925354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,1,power_law_1.2,0.10207359790802002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,1,power_law_1.2,0.10258560180664063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,128,balanced,0.03716800113519033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,128,balanced,0.03745600084463755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,128,power_law_1.01,0.035699200630187986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,128,power_law_1.01,0.03691520094871521
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,128,power_law_1.2,0.03592320084571839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,128,power_law_1.2,0.03612160086631775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,16,balanced,0.03941866755485535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,16,balanced,0.039520000418027244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,16,power_law_1.01,0.03802880048751831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,16,power_law_1.01,0.03825919926166534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,16,power_law_1.2,0.03863680064678192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,16,power_law_1.2,0.03869439959526062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,2,balanced,0.06222933530807495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,2,balanced,0.06234133243560791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,2,power_law_1.01,0.06321920156478882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,2,power_law_1.01,0.06529279947280883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,2,power_law_1.2,0.06603519916534424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,2,power_law_1.2,0.06655359864234925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,32,balanced,0.039493332306543984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,32,balanced,0.039642666776975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,32,power_law_1.01,0.036985599994659425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,32,power_law_1.01,0.03754880130290985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,32,power_law_1.2,0.03619840145111084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,32,power_law_1.2,0.036556801199913024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,4,balanced,0.049327999353408813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,4,balanced,0.051728000243504844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,4,power_law_1.01,0.048019200563430786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,4,power_law_1.01,0.049184000492095946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,4,power_law_1.2,0.04922240078449249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,4,power_law_1.2,0.050432002544403075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,64,balanced,0.03756800045569738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,64,balanced,0.03758399933576584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,64,power_law_1.01,0.036134400963783266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,64,power_law_1.01,0.03704319894313812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,64,power_law_1.2,0.03592320084571839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,64,power_law_1.2,0.036339199542999266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,8,balanced,0.05713599920272827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,8,balanced,0.062037333846092224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,8,power_law_1.01,0.04839679896831513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,8,power_law_1.01,0.05092480182647705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,8,power_law_1.2,0.05056639909744263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,1,8,power_law_1.2,0.05551999807357788
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,2,1,balanced,0.07127999762694041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,2,1,balanced,0.07202133536338806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,2,1,power_law_1.01,0.07063040137290955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,2,1,power_law_1.01,0.07089920043945312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,2,1,power_law_1.2,0.07043200135231018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,2,1,power_law_1.2,0.07247999906539918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,4,1,balanced,0.05850133299827576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,4,1,balanced,0.05997333427270254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,4,1,power_law_1.01,0.056959998607635495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,4,1,power_law_1.01,0.05815039873123169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,4,1,power_law_1.2,0.05922560095787048
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,2048,768,8,128,4,1,power_law_1.2,0.05932160019874573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,1,balanced,0.35678398609161377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,1,balanced,0.3591093222300212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,1,power_law_1.01,0.34739840030670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,1,power_law_1.01,0.3499520063400269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,1,power_law_1.2,0.35697920322418214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,1,power_law_1.2,0.37073280811309817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,128,balanced,0.04212800165017446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,128,balanced,0.042410666743914284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,128,power_law_1.01,0.03968639969825745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,128,power_law_1.01,0.03978239893913269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,128,power_law_1.2,0.038848000764846805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,128,power_law_1.2,0.03957119882106781
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,16,balanced,0.14541332920392355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,16,balanced,0.15152000387509665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,16,power_law_1.01,0.09058560132980346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,16,power_law_1.01,0.11715199947357177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,16,power_law_1.2,0.11503360271453858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,16,power_law_1.2,0.12136319875717164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,2,balanced,0.1811466614405314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,2,balanced,0.18189332882563272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,2,power_law_1.01,0.17011200189590453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,2,power_law_1.01,0.1701311945915222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,2,power_law_1.2,0.17736320495605468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,2,power_law_1.2,0.1781056046485901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,256,balanced,0.04121600091457367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,256,balanced,0.04159466673930486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,256,power_law_1.01,0.03868800103664398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,256,power_law_1.01,0.03896960020065308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,256,power_law_1.2,0.03813120126724243
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,256,power_law_1.2,0.03912320137023926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,32,balanced,0.058575997749964394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,32,balanced,0.06006933252016703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,32,power_law_1.01,0.05754240155220032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,32,power_law_1.01,0.0607807993888855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,32,power_law_1.2,0.05482879877090454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,32,power_law_1.2,0.05628799796104431
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,4,balanced,0.11010666688283284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,4,balanced,0.11075199643770854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,4,power_law_1.01,0.10241919755935669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,4,power_law_1.01,0.10419199466705323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,4,power_law_1.2,0.10618239641189575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,64,balanced,0.045696000258127846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,64,balanced,0.04784533381462097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,64,power_law_1.01,0.04327679872512817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,64,power_law_1.01,0.0451200008392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,64,power_law_1.2,0.04154880046844482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,64,power_law_1.2,0.0416128009557724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,8,balanced,0.09380267063776652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,8,balanced,0.09963732957839966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,8,power_law_1.01,0.07681279778480529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,8,power_law_1.01,0.07998719811439514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,8,power_law_1.2,0.07869439721107482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,1,8,power_law_1.2,0.07882879972457886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,2,1,balanced,0.21925334135691324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,2,1,balanced,0.2196000019709269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,2,1,power_law_1.01,0.21281919479370118
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,2,1,power_law_1.01,0.21290879249572753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,2,1,power_law_1.2,0.21909759044647217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,2,1,power_law_1.2,0.2216320037841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,4,1,balanced,0.13894933462142944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,4,1,balanced,0.1404800017674764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,4,1,power_law_1.01,0.13110400438308717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,4,1,power_law_1.01,0.13351039886474608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,4,1,power_law_1.2,0.13560960292816163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,4,1,power_law_1.2,0.13691519498825072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,8,1,balanced,0.10760533809661865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,8,1,balanced,0.1090826690196991
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,8,1,power_law_1.01,0.10361599922180176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,8,1,power_law_1.01,0.10582400560379028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,8,1,power_law_1.2,0.10492160320281982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,3072,1536,8,256,8,1,power_law_1.2,0.10524799823760986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,1,balanced,0.29761600494384766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,1,balanced,0.2988053361574809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,1,power_law_1.01,0.23752961158752442
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,1,power_law_1.01,0.24387838840484619
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,1,power_law_1.2,0.23347198963165283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,1,power_law_1.2,0.23571839332580566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,2,balanced,0.18615466356277466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,2,balanced,0.18714666366577148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,2,power_law_1.01,0.14464000463485718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,2,power_law_1.01,0.20723841190338135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,2,power_law_1.2,0.14247039556503296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,2,power_law_1.2,0.15966720581054689
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,4,balanced,0.11580800016721089
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,4,balanced,0.11620799700419109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,4,power_law_1.01,0.1107200026512146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,4,power_law_1.01,0.1331071972846985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,4,power_law_1.2,0.10170880556106568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,4,power_law_1.2,0.12222720384597778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,8,balanced,0.06651733318964641
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,8,balanced,0.06671466430028279
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,8,power_law_1.01,0.07996799945831298
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,8,power_law_1.01,0.08062719702720642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,8,power_law_1.2,0.08047360181808472
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,1,8,power_law_1.2,0.08569599986076355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,16,1,balanced,0.050426666935284935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,16,1,balanced,0.052186667919158936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,16,1,power_law_1.01,0.04583039879798889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,16,1,power_law_1.01,0.047225600481033324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,16,1,power_law_1.2,0.04353919923305512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,16,1,power_law_1.2,0.047712001204490664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,2,1,balanced,0.16268266240755716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,2,1,balanced,0.16340800126393637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,2,1,power_law_1.01,0.13371520042419432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,2,1,power_law_1.01,0.13556480407714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,2,1,power_law_1.2,0.13454079627990723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,2,1,power_law_1.2,0.14116480350494384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,32,1,balanced,0.04171200096607208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,32,1,balanced,0.04342933495839437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,32,1,power_law_1.01,0.039904001355171206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,32,1,power_law_1.01,0.04074240028858185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,32,1,power_law_1.2,0.040038400888442995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,32,1,power_law_1.2,0.04059520065784454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,4,1,balanced,0.1020960013071696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,4,1,balanced,0.10236266255378723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,4,1,power_law_1.01,0.08505600094795226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,4,1,power_law_1.01,0.09098240137100219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,4,1,power_law_1.2,0.08572160005569458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,4,1,power_law_1.2,0.08934400081634522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,8,1,balanced,0.07308800021807353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,8,1,balanced,0.07314666608969371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,8,1,power_law_1.01,0.061926400661468504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,8,1,power_law_1.01,0.06474879980087281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,8,1,power_law_1.2,0.06218879818916321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,14336,2,8,8,1,power_law_1.2,0.06408320069313049
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,1,balanced,0.2669066588083903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,1,balanced,0.2671893239021301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,1,power_law_1.01,0.2794624090194702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,1,power_law_1.01,0.2805952072143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,1,power_law_1.2,0.28933761119842527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,1,power_law_1.2,0.2916287899017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,128,balanced,0.04386133452256521
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,128,balanced,0.04418133199214935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,128,power_law_1.01,0.04317440092563629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,128,power_law_1.01,0.04323840141296387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,128,power_law_1.2,0.043110400438308716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,128,power_law_1.2,0.043219199776649474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,16,balanced,0.065461332599322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,16,balanced,0.0654720018307368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,16,power_law_1.01,0.06332799792289734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,16,power_law_1.01,0.06509439945220948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,16,power_law_1.2,0.06542720198631287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,16,power_law_1.2,0.06711040139198303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,2,balanced,0.1399999956289927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,2,balanced,0.1418186624844869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,2,power_law_1.01,0.1481727957725525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,2,power_law_1.01,0.1508031964302063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,2,power_law_1.2,0.1519551992416382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,2,power_law_1.2,0.1537984013557434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,32,balanced,0.04833599925041199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,32,balanced,0.048512001832326256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,32,power_law_1.01,0.04524160027503967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,32,power_law_1.01,0.04658559858798981
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,32,power_law_1.2,0.04730879962444305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,32,power_law_1.2,0.049267199635505673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,4,balanced,0.1083573301633199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,4,balanced,0.10969600081443787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,4,power_law_1.01,0.10003199577331542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,4,power_law_1.01,0.10112639665603637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,4,power_law_1.2,0.09939839839935302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,4,power_law_1.2,0.10076800584793091
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,64,balanced,0.04598399996757507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,64,balanced,0.04615999758243561
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,64,power_law_1.01,0.04316799938678741
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,64,power_law_1.01,0.04403199851512909
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,64,power_law_1.2,0.04344319999217987
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,64,power_law_1.2,0.04412800073623657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,8,balanced,0.15296000242233276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,8,balanced,0.1646986703077952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,8,power_law_1.01,0.11266560554504394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,8,power_law_1.01,0.1368831992149353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,8,power_law_1.2,0.10221439599990845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,1,8,power_law_1.2,0.10746239423751831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,2,1,balanced,0.169706662495931
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,2,1,balanced,0.17085866133371988
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,2,1,power_law_1.01,0.17128959894180298
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,2,1,power_law_1.01,0.17357439994812013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,2,1,power_law_1.2,0.1775488018989563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,2,1,power_law_1.2,0.17760000228881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,4,1,balanced,0.11168000102043152
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,4,1,balanced,0.11409599582354228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,4,1,power_law_1.01,0.11168639659881592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,4,1,power_law_1.01,0.11259520053863525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,4,1,power_law_1.2,0.11388800144195557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,4,1,power_law_1.2,0.11550079584121704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,8,1,balanced,0.08967999617258708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,8,1,balanced,0.09197333455085754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,8,1,power_law_1.01,0.08852480053901672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,8,1,power_law_1.01,0.08877440094947815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,8,1,power_law_1.2,0.08973439931869506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,4096,1536,8,128,8,1,power_law_1.2,0.08994560241699219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,1,balanced,0.4641866683959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,1,balanced,0.4662986596425374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,1,power_law_1.01,0.4443840026855469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,1,power_law_1.01,0.4463359832763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,1,power_law_1.2,0.4421504020690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,1,power_law_1.2,0.44306559562683107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,2,balanced,0.24341867367426553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,2,balanced,0.2441813349723816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,2,power_law_1.01,0.20558080673217774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,2,power_law_1.01,0.21045119762420655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,2,power_law_1.2,0.19867520332336425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,2,power_law_1.2,0.23931519985198973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,4,balanced,0.1301706631978353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,4,balanced,0.1318880021572113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,4,power_law_1.01,0.1675328016281128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,4,power_law_1.01,0.1882367968559265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,4,power_law_1.2,0.14244480133056642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,4,power_law_1.2,0.15475200414657592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,8,balanced,0.0803466687599818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,8,balanced,0.08040000001589458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,8,power_law_1.01,0.10643839836120605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,8,power_law_1.01,0.11413760185241699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,8,power_law_1.2,0.11026560068130493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,1,8,power_law_1.2,0.11323519945144653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,16,1,balanced,0.06411733229955037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,16,1,balanced,0.06598933537801106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,16,1,power_law_1.01,0.06032000184059143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,16,1,power_law_1.01,0.06056960225105286
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,16,1,power_law_1.2,0.060224002599716185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,16,1,power_law_1.2,0.06098560094833374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,2,1,balanced,0.2192373275756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,2,1,balanced,0.21978133916854858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,2,1,power_law_1.01,0.19530880451202393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,2,1,power_law_1.01,0.20424959659576417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,2,1,power_law_1.2,0.19545600414276124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,2,1,power_law_1.2,0.19693440198898315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,32,1,balanced,0.04797866443792979
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,32,1,balanced,0.049925332268079124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,32,1,power_law_1.01,0.04529280066490173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,32,1,power_law_1.01,0.046035200357437134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,32,1,power_law_1.2,0.04500479996204376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,32,1,power_law_1.2,0.04506239891052246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,4,1,balanced,0.13129599889119467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,4,1,balanced,0.13160000244776407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,4,1,power_law_1.01,0.11966079473495483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,4,1,power_law_1.01,0.12221440076828002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,4,1,power_law_1.2,0.1220479965209961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,4,1,power_law_1.2,0.12376960515975952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,8,1,balanced,0.0863146682580312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,8,1,balanced,0.0865760048230489
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,8,1,power_law_1.01,0.08085119724273682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,8,1,power_law_1.01,0.08379520177841186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,8,1,power_law_1.2,0.0803391993045807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,16384,2,8,8,1,power_law_1.2,0.08120959997177124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,1,balanced,0.891103982925415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,1,balanced,0.8955787022908529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,1,power_law_1.01,0.8919296264648438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,1,power_law_1.01,0.8969856262207031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,1,power_law_1.2,0.9281920433044434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,1,power_law_1.2,0.9386560440063476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,128,balanced,0.04985600213209788
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,128,balanced,0.05173333485921224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,128,power_law_1.01,0.04927999973297119
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,128,power_law_1.01,0.0497408002614975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,128,power_law_1.2,0.04871039986610413
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,128,power_law_1.2,0.04912639856338501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,16,balanced,0.2160266637802124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,16,balanced,0.2281493345896403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,16,power_law_1.01,0.1727679967880249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,16,power_law_1.01,0.17641600370407104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,16,power_law_1.2,0.14955519437789916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,16,power_law_1.2,0.15175039768218995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,2,balanced,0.42369067668914795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,2,balanced,0.42388800779978436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,2,power_law_1.01,0.40567679405212403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,2,power_law_1.01,0.4134399890899658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,2,power_law_1.2,0.41187200546264646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,2,power_law_1.2,0.4154496192932129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,256,balanced,0.04974933465321859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,256,balanced,0.05004266897837321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,256,power_law_1.01,0.04790399968624115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,256,power_law_1.01,0.048198398947715757
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,256,power_law_1.2,0.04766719937324524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,256,power_law_1.2,0.047712001204490664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,32,balanced,0.08227199812730153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,32,balanced,0.08454933762550354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,32,power_law_1.01,0.07806079983711242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,32,power_law_1.01,0.07864320278167725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,32,power_law_1.2,0.07800319790840149
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,32,power_law_1.2,0.07946239709854126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,4,balanced,0.23676800727844238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,4,balanced,0.237664004166921
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,4,power_law_1.01,0.2186431884765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,4,power_law_1.01,0.22617599964141846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,4,power_law_1.2,0.22958719730377197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,4,power_law_1.2,0.23130240440368652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,64,balanced,0.061018665631612144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,64,balanced,0.06286400059858958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,64,power_law_1.01,0.056460797786712646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,64,power_law_1.01,0.058508801460266116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,64,power_law_1.2,0.05681920051574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,64,power_law_1.2,0.05722879767417908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,8,balanced,0.1787946621576945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,8,balanced,0.18073066075642905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,8,power_law_1.01,0.14234880208969117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,8,power_law_1.01,0.14854400157928466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,8,power_law_1.2,0.1497663974761963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,1,8,power_law_1.2,0.15140479803085327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,16,1,balanced,0.16179733475049338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,16,1,balanced,0.16184533635775247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,16,1,power_law_1.01,0.15573760271072387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,16,1,power_law_1.01,0.15777280330657958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,16,1,power_law_1.2,0.16075520515441893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,16,1,power_law_1.2,0.16083199977874757
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,2,1,balanced,0.4732106526692708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,2,1,balanced,0.4740746815999349
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,2,1,power_law_1.01,0.4576831817626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,2,1,power_law_1.01,0.4628159999847412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,2,1,power_law_1.2,0.4723775863647461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,2,1,power_law_1.2,0.48583040237426756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,32,1,balanced,0.1439306636651357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,32,1,balanced,0.14412267009417215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,32,1,power_law_1.01,0.1418303966522217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,32,1,power_law_1.01,0.1419584035873413
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,32,1,power_law_1.2,0.1418303966522217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,32,1,power_law_1.2,0.1427135944366455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,4,1,balanced,0.2796960075696309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,4,1,balanced,0.2807199954986572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,4,1,power_law_1.01,0.270086407661438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,4,1,power_law_1.01,0.27571840286254884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,4,1,power_law_1.2,0.2777024030685425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,4,1,power_law_1.2,0.28107519149780275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,8,1,balanced,0.19567465782165527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,8,1,balanced,0.1971893310546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,8,1,power_law_1.01,0.187391996383667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,8,1,power_law_1.01,0.18812799453735352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,8,1,power_law_1.2,0.19322880506515502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2048,8,256,8,1,power_law_1.2,0.1940160036087036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,1,balanced,0.7290346622467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,1,balanced,0.7310880025227865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,1,power_law_1.01,0.7204160213470459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,1,power_law_1.01,0.7235263824462891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,1,power_law_1.2,0.7467072010040283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,1,power_law_1.2,0.7561855792999268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,16,balanced,0.1239306628704071
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,16,balanced,0.13075733184814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,16,power_law_1.01,0.09763839840888977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,16,power_law_1.01,0.09870079755783082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,16,power_law_1.2,0.1184831976890564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,16,power_law_1.2,0.13200639486312865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,2,balanced,0.3449866771697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,2,balanced,0.3463946580886841
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,2,power_law_1.01,0.3487168073654175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,2,power_law_1.01,0.3560447931289673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,2,power_law_1.2,0.36222081184387206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,2,power_law_1.2,0.3659712076187134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,32,balanced,0.07617599765459697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,32,balanced,0.07981866598129272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,32,power_law_1.01,0.07146239876747132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,32,power_law_1.01,0.07319039702415467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,32,power_law_1.2,0.07281280159950257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,32,power_law_1.2,0.07909119725227357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,4,balanced,0.25353066126505536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,4,balanced,0.2537173430124919
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,4,power_law_1.01,0.20609281063079835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,4,power_law_1.01,0.21009280681610107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,4,power_law_1.2,0.2132159948348999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,4,power_law_1.2,0.21426560878753662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,8,balanced,0.32703999678293866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,8,balanced,0.33418134848276776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,8,power_law_1.01,0.2066175937652588
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,8,power_law_1.01,0.24289920330047607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,8,power_law_1.2,0.21087999343872071
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,1,8,power_law_1.2,0.2544895887374878
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,2,1,balanced,0.40565868218739826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,2,1,balanced,0.40669866402943927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,2,1,power_law_1.01,0.3916991949081421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,2,1,power_law_1.01,0.3961535930633545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,2,1,power_law_1.2,0.40698881149291993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,2,1,power_law_1.2,0.4131328105926514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,4,1,balanced,0.2592693368593852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,4,1,balanced,0.2604479988416036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,4,1,power_law_1.01,0.24176640510559083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,4,1,power_law_1.01,0.24388480186462402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,4,1,power_law_1.2,0.25057919025421144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,4,1,power_law_1.2,0.251475191116333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,8,1,balanced,0.16387200355529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,8,1,balanced,0.16448000073432922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,8,1,power_law_1.01,0.15196160078048707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,8,1,power_law_1.01,0.15290240049362183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,8,1,power_law_1.2,0.15356800556182862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,6144,2560,8,160,8,1,power_law_1.2,0.15484800338745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,1,balanced,1.0439733664194744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,1,balanced,1.0499359766642253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,1,power_law_1.01,1.0307007789611817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,1,power_law_1.01,1.0553919792175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,1,power_law_1.2,1.0855039596557616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,1,power_law_1.2,1.1180288314819335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,128,balanced,0.054042667150497437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,128,balanced,0.05586666862169901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,128,power_law_1.01,0.05321599841117859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,128,power_law_1.01,0.053388798236846925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,128,power_law_1.2,0.05297279953956604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,128,power_law_1.2,0.054054397344589236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,16,balanced,0.24356265862782797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,16,balanced,0.24811200300852457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,16,power_law_1.01,0.1662783980369568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,16,power_law_1.01,0.18486399650573732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,16,power_law_1.2,0.15898879766464233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,16,power_law_1.2,0.16885119676589966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,2,balanced,0.48867201805114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,2,balanced,0.48949865500132245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,2,power_law_1.01,0.4571648120880127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,2,power_law_1.01,0.4677120208740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,2,power_law_1.2,0.4936192035675049
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,2,power_law_1.2,0.4965504169464111
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,256,balanced,0.05203733344872793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,256,balanced,0.05277866621812185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,256,power_law_1.01,0.05089920163154602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,256,power_law_1.01,0.0514303982257843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,256,power_law_1.2,0.05185920000076294
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,256,power_law_1.2,0.05208960175514221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,32,balanced,0.09322133660316467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,32,balanced,0.09506666660308838
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,32,power_law_1.01,0.09031040072441102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,32,power_law_1.01,0.09098880290985108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,32,power_law_1.2,0.08504319787025452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,32,power_law_1.2,0.08647680282592773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,4,balanced,0.2716853419939677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,4,balanced,0.272213339805603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,4,power_law_1.01,0.25319039821624756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,4,power_law_1.01,0.26206719875335693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,4,power_law_1.2,0.2561280012130737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,4,power_law_1.2,0.26261119842529296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,64,balanced,0.07039999961853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,64,balanced,0.07167466481526692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,64,power_law_1.01,0.06403200030326843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,64,power_law_1.01,0.06448000073432922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,64,power_law_1.2,0.06455680131912231
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,64,power_law_1.2,0.06506239771842956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,8,balanced,0.19810134172439575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,8,balanced,0.1984106699625651
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,8,power_law_1.01,0.16143360137939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,8,power_law_1.01,0.16298240423202515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,8,power_law_1.2,0.164300799369812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,1,8,power_law_1.2,0.1730239987373352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,16,1,balanced,0.18362132708231607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,16,1,balanced,0.18473066886266074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,16,1,power_law_1.01,0.17956479787826538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,16,1,power_law_1.01,0.1799232006072998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,16,1,power_law_1.2,0.182860803604126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,16,1,power_law_1.2,0.18336000442504882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,2,1,balanced,0.5486293236414591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,2,1,balanced,0.5512906710306803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,2,1,power_law_1.01,0.5324160099029541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,2,1,power_law_1.01,0.5484928131103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,2,1,power_law_1.2,0.5607295989990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,2,1,power_law_1.2,0.5684224128723144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,32,1,balanced,0.16404799620310465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,32,1,balanced,0.16475733121236166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,32,1,power_law_1.01,0.15987199544906616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,32,1,power_law_1.01,0.16035200357437135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,32,1,power_law_1.2,0.16243840456008912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,32,1,power_law_1.2,0.16344959735870362
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,4,1,balanced,0.3232853412628174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,4,1,balanced,0.327237327893575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,4,1,power_law_1.01,0.31334400177001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,4,1,power_law_1.01,0.3147455930709839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,4,1,power_law_1.2,0.3231679916381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,4,1,power_law_1.2,0.32554240226745607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,8,1,balanced,0.22503467400868735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,8,1,balanced,0.22522666056950888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,8,1,power_law_1.01,0.2172032117843628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,8,1,power_law_1.01,0.21727359294891357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,8,1,power_law_1.2,0.22248320579528807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,256,8,1,power_law_1.2,0.22351999282836915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,1,balanced,1.3633440335591633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,1,balanced,1.3649546305338542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,1,power_law_1.01,1.255782413482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,1,power_law_1.01,1.2751168251037597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,1,power_law_1.2,1.3019840240478515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,1,power_law_1.2,1.3152000427246093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,128,balanced,0.05986666679382324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,128,balanced,0.060175999999046326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,128,power_law_1.01,0.05788159966468811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,128,power_law_1.01,0.058303999900817874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,128,power_law_1.2,0.057043200731277464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,128,power_law_1.2,0.058380800485610965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,16,balanced,0.1579146683216095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,16,balanced,0.1585493286450704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,16,power_law_1.01,0.12065279483795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,16,power_law_1.01,0.12578560113906861
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,16,power_law_1.2,0.12090239524841309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,16,power_law_1.2,0.13220479488372802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,2,balanced,0.7075839837392172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,2,balanced,0.7091733614603678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,2,power_law_1.01,0.6959743976593018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,2,power_law_1.01,0.7015103816986084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,2,power_law_1.2,0.6824960231781005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,2,power_law_1.2,0.6975935935974121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,32,balanced,0.187226672967275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,32,balanced,0.19662400086720785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,32,power_law_1.01,0.1461951971054077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,32,power_law_1.01,0.1583359956741333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,32,power_law_1.2,0.12328319549560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,32,power_law_1.2,0.1233407974243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,4,balanced,0.37514666716257733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,4,balanced,0.3752640088399251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,4,power_law_1.01,0.3265919923782349
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,4,power_law_1.01,0.3367167949676514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,4,power_law_1.2,0.32371840476989744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,4,power_law_1.2,0.3334208011627197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,64,balanced,0.08683199683825175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,64,balanced,0.08707200487454732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,64,power_law_1.01,0.08232319951057435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,64,power_law_1.01,0.0825984001159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,64,power_law_1.2,0.0782144010066986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,64,power_law_1.2,0.08138239979743958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,8,balanced,0.2172159949938456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,8,balanced,0.21732799212137857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,8,power_law_1.01,0.18892159461975097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,8,power_law_1.01,0.20028159618377686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,8,power_law_1.2,0.19103360176086426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,1,8,power_law_1.2,0.19713280200958253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,16,1,balanced,0.18648000558217367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,16,1,balanced,0.18986133734385172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,16,1,power_law_1.01,0.20208640098571778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,16,1,power_law_1.01,0.20325760841369628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,16,1,power_law_1.2,0.20330240726470947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,16,1,power_law_1.2,0.2035072088241577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,2,1,balanced,0.715669314066569
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,2,1,balanced,0.717408021291097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,2,1,power_law_1.01,0.6538112163543701
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,2,1,power_law_1.01,0.6628992080688476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,2,1,power_law_1.2,0.6646207809448242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,2,1,power_law_1.2,0.6727039813995361
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,32,1,balanced,0.15850133697191873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,32,1,balanced,0.16038399934768677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,32,1,power_law_1.01,0.17820160388946532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,32,1,power_law_1.01,0.17932800054550171
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,32,1,power_law_1.2,0.17859840393066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,32,1,power_law_1.2,0.18273919820785522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,4,1,balanced,0.39666132132212323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,4,1,balanced,0.39693331718444824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,4,1,power_law_1.01,0.3733247995376587
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,4,1,power_law_1.01,0.37900800704956056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,4,1,power_law_1.2,0.3814079999923706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,4,1,power_law_1.2,0.3829375982284546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,8,1,balanced,0.24546132485071817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,8,1,balanced,0.24649600187937418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,8,1,power_law_1.01,0.25189759731292727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,8,1,power_law_1.01,0.25231359004974363
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,8,1,power_law_1.2,0.25384318828582764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,384,7168,2048,8,384,8,1,power_law_1.2,0.25397119522094724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,1,balanced,0.03350399931271871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,1,balanced,0.03555200000603994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,1,power_law_1.01,0.03761920034885406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,1,power_law_1.01,0.03811840116977692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,1,power_law_1.2,0.0331712007522583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,1,power_law_1.2,0.03518719971179962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,128,balanced,0.023423999547958374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,128,balanced,0.025205334027608235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,128,power_law_1.01,0.022124800086021423
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,128,power_law_1.01,0.023609599471092223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,128,power_law_1.2,0.02172800004482269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,128,power_law_1.2,0.022201600670814513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,16,balanced,0.023215999205907185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,16,balanced,0.023376000424226124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,16,power_law_1.01,0.023552000522613525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,16,power_law_1.01,0.023647999763488768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,16,power_law_1.2,0.023871999979019166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,16,power_law_1.2,0.024160000681877136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,2,balanced,0.029461334149042766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,2,balanced,0.029493334392706554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,2,power_law_1.01,0.02919679880142212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,2,power_law_1.01,0.0313728004693985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,2,power_law_1.2,0.028467199206352232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,2,power_law_1.2,0.030329599976539612
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,32,balanced,0.023269332945346832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,32,balanced,0.025173333783944447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,32,power_law_1.01,0.02295680046081543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,32,power_law_1.01,0.02305919975042343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,32,power_law_1.2,0.021139200031757354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,32,power_law_1.2,0.022310400009155275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,4,balanced,0.02693866689999898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,4,balanced,0.02720533311367035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,4,power_law_1.01,0.026291200518608095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,4,power_law_1.01,0.028019198775291444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,4,power_law_1.2,0.02622080147266388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,4,power_law_1.2,0.02627840042114258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,64,balanced,0.023178666830062866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,64,balanced,0.025301332275072735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,64,power_law_1.01,0.021779200434684752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,64,power_law_1.01,0.023788799345493317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,64,power_law_1.2,0.021555200219154358
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,64,power_law_1.2,0.02181120067834854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,8,balanced,0.025114665428797405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,8,balanced,0.025519999365011852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,8,power_law_1.01,0.025516799092292784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,8,power_law_1.01,0.025561600923538208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,8,power_law_1.2,0.026707199215888978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,1,8,power_law_1.2,0.027327999472618103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,2,1,balanced,0.029296000798543293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,2,1,balanced,0.029466666281223297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,2,1,power_law_1.01,0.029286399483680725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,2,1,power_law_1.01,0.029843199253082275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,2,1,power_law_1.2,0.028326401114463808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,2,1,power_law_1.2,0.02913280129432678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,4,1,balanced,0.02718399961789449
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,4,1,balanced,0.02808533360560735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,4,1,power_law_1.01,0.02484479993581772
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,4,1,power_law_1.01,0.025164800882339477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,4,1,power_law_1.2,0.024607999622821806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,2048,768,8,128,4,1,power_law_1.2,0.025113600492477416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,1,balanced,0.064560001095136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,1,balanced,0.06599466502666473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,1,power_law_1.01,0.06307839751243591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,1,power_law_1.01,0.06407039761543273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,1,power_law_1.2,0.06357120275497437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,1,power_law_1.2,0.06401919722557067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,128,balanced,0.023168000082174938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,128,balanced,0.02518400053183238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,128,power_law_1.01,0.0230335995554924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,128,power_law_1.01,0.02366719990968704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,128,power_law_1.2,0.022463999688625336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,128,power_law_1.2,0.02295680046081543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,16,balanced,0.025407999753952026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,16,balanced,0.027349332968393963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,16,power_law_1.01,0.045491200685501096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,16,power_law_1.01,0.04625920057296753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,16,power_law_1.2,0.043808001279830935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,16,power_law_1.2,0.04446719884872437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,2,balanced,0.045781334241231285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,2,balanced,0.04595733185609182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,2,power_law_1.01,0.055193597078323366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,2,power_law_1.01,0.05620480179786682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,2,power_law_1.2,0.053862398862838744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,2,power_law_1.2,0.054739201068878175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,256,balanced,0.02679466704527537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,256,balanced,0.027162666122118633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,256,power_law_1.01,0.02285439968109131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,256,power_law_1.01,0.02372480034828186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,256,power_law_1.2,0.022995199263095855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,256,power_law_1.2,0.023391999304294586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,32,balanced,0.025978667040665943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,32,balanced,0.02717333287000656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,32,power_law_1.01,0.028377598524093627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,32,power_law_1.01,0.02961919903755188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,32,power_law_1.2,0.028288000822067262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,32,power_law_1.2,0.028723201155662535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,4,balanced,0.030608000854651134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,4,balanced,0.03142933299144109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,4,power_law_1.01,0.05193600058555603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,4,power_law_1.01,0.05275520086288452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,4,power_law_1.2,0.04751999974250794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,4,power_law_1.2,0.04844799935817719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,64,balanced,0.025194667279720306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,64,balanced,0.0252960001428922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,64,power_law_1.01,0.02588160037994385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,64,power_law_1.01,0.02698880136013031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,64,power_law_1.2,0.026131200790405273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,64,power_law_1.2,0.026464000344276428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,8,balanced,0.02737066646416982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,8,balanced,0.027503999571005504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,8,power_law_1.01,0.05141760110855102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,8,power_law_1.01,0.05214080214500427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,8,power_law_1.2,0.040915200114250184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,1,8,power_law_1.2,0.0456063985824585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,2,1,balanced,0.04613866905371348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,2,1,balanced,0.047557334105173744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,2,1,power_law_1.01,0.046700799465179445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,2,1,power_law_1.01,0.04739840030670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,2,1,power_law_1.2,0.04629760086536407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,2,1,power_law_1.2,0.047091200947761536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,4,1,balanced,0.03155199935038885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,4,1,balanced,0.032245332996050514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,4,1,power_law_1.01,0.03213439881801605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,4,1,power_law_1.01,0.03224959969520569
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,4,1,power_law_1.2,0.032601600885391234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,4,1,power_law_1.2,0.034092798829078674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,8,1,balanced,0.027984000742435455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,8,1,balanced,0.028229333460330963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,8,1,power_law_1.01,0.02746239900588989
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,8,1,power_law_1.01,0.028543999791145323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,8,1,power_law_1.2,0.027795198559761047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,3072,1536,8,256,8,1,power_law_1.2,0.029043200612068176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,1,balanced,0.1395680010318756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,1,balanced,0.1399679978688558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,1,power_law_1.01,0.08725119829177856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,1,power_law_1.01,0.09726719856262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,1,power_law_1.2,0.08441600203514099
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,1,power_law_1.2,0.09106559753417968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,2,balanced,0.08380267024040222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,2,balanced,0.08545600374539693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,2,power_law_1.01,0.06478719711303711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,2,power_law_1.01,0.06757760047912598
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,2,power_law_1.2,0.057631999254226685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,2,power_law_1.2,0.0670144021511078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,4,balanced,0.058517331878344216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,4,balanced,0.059845333298047386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,4,power_law_1.01,0.052172797918319705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,4,power_law_1.01,0.056358402967453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,4,power_law_1.2,0.05050240159034729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,4,power_law_1.2,0.054579198360443115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,8,balanced,0.04191466669241587
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,8,balanced,0.04370133578777313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,8,power_law_1.01,0.04110080003738403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,8,power_law_1.01,0.04151679873466492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,8,power_law_1.2,0.039955198764801025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,1,8,power_law_1.2,0.04196479916572571
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,16,1,balanced,0.029445332785447437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,16,1,balanced,0.02956799914439519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,16,1,power_law_1.01,0.025017601251602174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,16,1,power_law_1.01,0.02736639976501465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,16,1,power_law_1.2,0.025472000241279602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,16,1,power_law_1.2,0.02648960053920746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,2,1,balanced,0.08443199594815572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,2,1,balanced,0.08481599887212117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,2,1,power_law_1.01,0.05917440056800842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,2,1,power_law_1.01,0.062003201246261595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,2,1,power_law_1.2,0.06111999750137329
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,2,1,power_law_1.2,0.06317440271377564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,32,1,balanced,0.025397333006064098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,32,1,balanced,0.029146666328112285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,32,1,power_law_1.01,0.024556800723075867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,32,1,power_law_1.01,0.026931199431419372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,32,1,power_law_1.2,0.02566399872303009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,32,1,power_law_1.2,0.02640640139579773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,4,1,balanced,0.057487999399503074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,4,1,balanced,0.058005332946777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,4,1,power_law_1.01,0.04257920086383819
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,4,1,power_law_1.01,0.042656001448631284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,4,1,power_law_1.2,0.04085760116577149
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,4,1,power_law_1.2,0.043321600556373595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,8,1,balanced,0.03707200040419897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,8,1,balanced,0.037845333417256675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,8,1,power_law_1.01,0.029747200012207032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,8,1,power_law_1.01,0.031071999669075014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,8,1,power_law_1.2,0.027577599883079527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,14336,2,8,8,1,power_law_1.2,0.028825598955154418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,1,balanced,0.07660800218582153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,1,balanced,0.07668800155321757
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,1,power_law_1.01,0.07367680072784424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,1,power_law_1.01,0.07553920149803162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,1,power_law_1.2,0.06984320282936096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,1,power_law_1.2,0.07017599940299987
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,128,balanced,0.027210667729377747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,128,balanced,0.027461332579453785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,128,power_law_1.01,0.025472000241279602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,128,power_law_1.01,0.025772801041603087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,128,power_law_1.2,0.024633599817752837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,128,power_law_1.2,0.025651198625564576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,16,balanced,0.027109332382678986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,16,balanced,0.027386667827765148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,16,power_law_1.01,0.03213439881801605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,16,power_law_1.01,0.0323199987411499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,16,power_law_1.2,0.03237119913101196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,16,power_law_1.2,0.03250559866428375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,2,balanced,0.05338666836420695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,2,balanced,0.053616002202034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,2,power_law_1.01,0.05720319747924805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,2,power_law_1.01,0.05726720094680786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,2,power_law_1.2,0.056857597827911374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,2,power_law_1.2,0.05742719769477844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,32,balanced,0.025818665822347004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,32,balanced,0.026506667335828144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,32,power_law_1.01,0.02587519884109497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,32,power_law_1.01,0.02619520127773285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,32,power_law_1.2,0.02588160037994385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,32,power_law_1.2,0.02595840096473694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,4,balanced,0.0329120010137558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,4,balanced,0.036730666955312095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,4,power_law_1.01,0.04929920136928558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,4,power_law_1.01,0.05008640289306641
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,4,power_law_1.2,0.04286080002784729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,4,power_law_1.2,0.04611839950084686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,64,balanced,0.025285333395004272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,64,balanced,0.02722666660944621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,64,power_law_1.01,0.024255999922752382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,64,power_law_1.01,0.025785601139068602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,64,power_law_1.2,0.023705600202083586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,64,power_law_1.2,0.02534399926662445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,8,balanced,0.02770666778087616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,8,balanced,0.028416000306606293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,8,power_law_1.01,0.03896960020065308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,8,power_law_1.01,0.03909760117530823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,8,power_law_1.2,0.04340479969978332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,1,8,power_law_1.2,0.04424319863319397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,2,1,balanced,0.05489600201447805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,2,1,balanced,0.05561066667238871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,2,1,power_law_1.01,0.05330560207366943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,2,1,power_law_1.01,0.053574401140213015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,2,1,power_law_1.2,0.050969600677490234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,2,1,power_law_1.2,0.05120639801025391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,4,1,balanced,0.035589332381884255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,4,1,balanced,0.03570133447647095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,4,1,power_law_1.01,0.03649280071258545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,4,1,power_law_1.01,0.04026240110397339
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,4,1,power_law_1.2,0.03649280071258545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,4,1,power_law_1.2,0.038649600744247434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,8,1,balanced,0.02976000060637792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,8,1,balanced,0.031397332747777305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,8,1,power_law_1.01,0.030508801341056824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,8,1,power_law_1.01,0.03142400085926056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,8,1,power_law_1.2,0.028934401273727418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,4096,1536,8,128,8,1,power_law_1.2,0.02968960106372833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,1,balanced,0.21770666042963663
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,1,balanced,0.21945067246754965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,1,power_law_1.01,0.13515520095825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,1,power_law_1.01,0.1392832040786743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,1,power_law_1.2,0.13731839656829833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,1,power_law_1.2,0.13780479431152343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,2,balanced,0.12638933459917703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,2,balanced,0.12771733601888022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,2,power_law_1.01,0.08524799942970276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,2,power_law_1.01,0.09102720022201538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,2,power_law_1.2,0.096697598695755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,2,power_law_1.2,0.11112320423126221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,4,balanced,0.07758399844169617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,4,balanced,0.07872533301512401
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,4,power_law_1.01,0.06312320232391358
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,4,power_law_1.01,0.06826239824295044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,4,power_law_1.2,0.06504319906234741
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,4,power_law_1.2,0.0769536018371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,8,balanced,0.055306668082873024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,8,balanced,0.0562720000743866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,8,power_law_1.01,0.05336959958076477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,8,power_law_1.01,0.05408639907836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,8,power_law_1.2,0.0536575973033905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,1,8,power_law_1.2,0.05514879822731018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,16,1,balanced,0.03251733382542928
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,16,1,balanced,0.03379199902216593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,16,1,power_law_1.01,0.027961599826812743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,16,1,power_law_1.01,0.028787198662757873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,16,1,power_law_1.2,0.02805759906768799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,16,1,power_law_1.2,0.029209598898887634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,2,1,balanced,0.1243893305460612
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,2,1,balanced,0.1256480018297831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,2,1,power_law_1.01,0.08227840065956116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,2,1,power_law_1.01,0.09657599925994872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,2,1,power_law_1.2,0.08330879807472229
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,2,1,power_law_1.2,0.08401280045509338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,32,1,balanced,0.028463999430338543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,32,1,balanced,0.03017599880695343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,32,1,power_law_1.01,0.02640640139579773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,32,1,power_law_1.01,0.027091199159622194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,32,1,power_law_1.2,0.026208001375198364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,4,1,balanced,0.07813866436481476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,4,1,balanced,0.07875200112660725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,4,1,power_law_1.01,0.05379199981689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,4,1,power_law_1.01,0.05676159858703613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,4,1,power_law_1.2,0.05249279737472534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,4,1,power_law_1.2,0.053932797908782956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,8,1,balanced,0.05305066704750061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,8,1,balanced,0.05379733443260193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,8,1,power_law_1.01,0.03819519877433777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,8,1,power_law_1.01,0.03978880047798157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,8,1,power_law_1.2,0.03612799942493439
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,16384,2,8,8,1,power_law_1.2,0.04195199906826019
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,1,balanced,0.1244053343931834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,1,balanced,0.1244586706161499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,1,power_law_1.01,0.12017920017242431
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,1,power_law_1.01,0.1221119999885559
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,1,power_law_1.2,0.12183680534362792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,1,power_law_1.2,0.12189439535140992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,128,balanced,0.0281333327293396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,128,balanced,0.029472000896930695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,128,power_law_1.01,0.02698880136013031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,128,power_law_1.01,0.02901119887828827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,128,power_law_1.2,0.026943999528884887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,128,power_law_1.2,0.027398398518562316
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,16,balanced,0.02945599953333537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,16,balanced,0.02997333308060964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,16,power_law_1.01,0.07381119728088378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,16,power_law_1.01,0.07420160174369812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,16,power_law_1.2,0.0693120002746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,16,power_law_1.2,0.0711296021938324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,2,balanced,0.07689600189526875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,2,balanced,0.07849599917729695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,2,power_law_1.01,0.09673600196838379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,2,power_law_1.01,0.10331519842147827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,2,power_law_1.2,0.09516159892082214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,2,power_law_1.2,0.09724159836769104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,256,balanced,0.027093333502610523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,256,balanced,0.027600000301996868
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,256,power_law_1.01,0.026092800498008727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,256,power_law_1.01,0.027315199375152588
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,256,power_law_1.2,0.025472000241279602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,256,power_law_1.2,0.02547839879989624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,32,balanced,0.027664000789324444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,32,balanced,0.029264000554879505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,32,power_law_1.01,0.05156480073928833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,32,power_law_1.01,0.05275520086288452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,32,power_law_1.2,0.051974397897720334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,32,power_law_1.2,0.05325440168380737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,4,balanced,0.05382933219273885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,4,balanced,0.05402133365472158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,4,power_law_1.01,0.08824959993362427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,4,power_law_1.01,0.09275519847869873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,4,power_law_1.2,0.07973759770393371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,4,power_law_1.2,0.08021119832992554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,64,balanced,0.027509334186712902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,64,balanced,0.029290666182835896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,64,power_law_1.01,0.031865599751472476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,64,power_law_1.01,0.03249920010566711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,64,power_law_1.2,0.031142398715019226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,64,power_law_1.2,0.03329919874668121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,8,balanced,0.03350399931271871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,8,balanced,0.03573333223660787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,8,power_law_1.01,0.07863039970397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,8,power_law_1.01,0.08442879915237426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,8,power_law_1.2,0.07364479899406433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,1,8,power_law_1.2,0.07454079985618592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,16,1,balanced,0.0315786674618721
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,16,1,balanced,0.033173332611719765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,16,1,power_law_1.01,0.031225600838661195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,16,1,power_law_1.01,0.031999999284744264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,16,1,power_law_1.2,0.0321727991104126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,16,1,power_law_1.2,0.03447040021419525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,2,1,balanced,0.07702933251857758
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,2,1,balanced,0.07817600170771281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,2,1,power_law_1.01,0.07538560032844543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,2,1,power_law_1.01,0.07675520181655884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,2,1,power_law_1.2,0.07610880136489868
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,2,1,power_law_1.2,0.07615360021591186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,32,1,balanced,0.03138133386770884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,32,1,balanced,0.032405334214369454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,32,1,power_law_1.01,0.0304639995098114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,32,1,power_law_1.01,0.031040000915527343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,32,1,power_law_1.2,0.030092799663543703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,32,1,power_law_1.2,0.030393600463867188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,4,1,balanced,0.0553653339544932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,4,1,balanced,0.05553600192070007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,4,1,power_law_1.01,0.05258240103721619
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,4,1,power_law_1.01,0.05272960066795349
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,4,1,power_law_1.2,0.05281280279159546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,4,1,power_law_1.2,0.05289599895477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,8,1,balanced,0.0346666673819224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,8,1,balanced,0.03700266778469086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,8,1,power_law_1.01,0.03694080114364624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,8,1,power_law_1.01,0.037427198886871335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,8,1,power_law_1.2,0.036831998825073244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2048,8,256,8,1,power_law_1.2,0.03726719915866852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,1,balanced,0.14657066265741983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,1,balanced,0.14757333199183145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,1,power_law_1.01,0.1441151976585388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,1,power_law_1.01,0.14426239728927612
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,1,power_law_1.2,0.141484797000885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,1,power_law_1.2,0.1435263991355896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,16,balanced,0.029343999922275543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,16,balanced,0.029472000896930695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,16,power_law_1.01,0.06441599726676941
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,16,power_law_1.01,0.06502400040626526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,16,power_law_1.2,0.061849600076675414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,16,power_law_1.2,0.06444799900054932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,2,balanced,0.08959466218948364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,2,balanced,0.09088533123334248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,2,power_law_1.01,0.10743680000305175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,2,power_law_1.01,0.10869120359420777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,2,power_law_1.2,0.10242559909820556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,2,power_law_1.2,0.1102720022201538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,32,balanced,0.029317334294319153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,32,balanced,0.029743999242782593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,32,power_law_1.01,0.0469184011220932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,32,power_law_1.01,0.04782719910144806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,32,power_law_1.2,0.045542401075363156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,32,power_law_1.2,0.04657280147075653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,4,balanced,0.060821334520975746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,4,balanced,0.060975998640060425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,4,power_law_1.01,0.0824895977973938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,4,power_law_1.01,0.09047679901123047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,4,power_law_1.2,0.08359040021896362
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,4,power_law_1.2,0.08448640108108521
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,8,balanced,0.04165866722663244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,8,balanced,0.04179200033346812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,8,power_law_1.01,0.0725055992603302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,8,power_law_1.01,0.07688959836959838
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,8,power_law_1.2,0.07212160229682922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,1,8,power_law_1.2,0.07223039865493774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,2,1,balanced,0.08967467149098714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,2,1,balanced,0.09054399530092876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,2,1,power_law_1.01,0.08848000168800355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,2,1,power_law_1.01,0.08938239812850952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,2,1,power_law_1.2,0.08727040290832519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,2,1,power_law_1.2,0.08792960047721862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,4,1,balanced,0.06451199948787689
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,4,1,balanced,0.06490133206049602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,4,1,power_law_1.01,0.06158080101013184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,4,1,power_law_1.01,0.06259840130805969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,4,1,power_law_1.2,0.06239359974861145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,4,1,power_law_1.2,0.0627839982509613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,8,1,balanced,0.04266133407751719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,8,1,balanced,0.04562133550643921
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,8,1,power_law_1.01,0.046265599131584165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,8,1,power_law_1.01,0.04645119905471802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,8,1,power_law_1.2,0.044435200095176694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,6144,2560,8,160,8,1,power_law_1.2,0.04535680115222931
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,1,balanced,0.13942399621009827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,1,balanced,0.139765332142512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,1,power_law_1.01,0.13726719617843627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,1,power_law_1.01,0.13834240436553955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,1,power_law_1.2,0.13594239950180054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,1,power_law_1.2,0.13693439960479736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,128,balanced,0.029520000020662945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,128,balanced,0.03014400104681651
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,128,power_law_1.01,0.027449598908424376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,128,power_law_1.01,0.028672000765800475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,128,power_law_1.2,0.02805759906768799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,128,power_law_1.2,0.02953599989414215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,16,balanced,0.029370665550231934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,16,balanced,0.031301334500312805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,16,power_law_1.01,0.08364800214767457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,16,power_law_1.01,0.08370559811592101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,16,power_law_1.2,0.07847679853439331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,16,power_law_1.2,0.07916799783706666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,2,balanced,0.08571199576059978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,2,balanced,0.08672533432642619
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,2,power_law_1.01,0.11793919801712036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,2,power_law_1.01,0.11820160150527954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,2,power_law_1.2,0.09652479887008666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,2,power_law_1.2,0.10209920406341552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,256,balanced,0.02731200059254964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,256,balanced,0.027914665639400482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,256,power_law_1.01,0.026528000831604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,256,power_law_1.01,0.028441599011421202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,256,power_law_1.2,0.02717440128326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,256,power_law_1.2,0.028595200181007384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,32,balanced,0.029279999434947968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,32,balanced,0.029445332785447437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,32,power_law_1.01,0.054604798555374146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,32,power_law_1.01,0.056979197263717654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,32,power_law_1.2,0.05440639853477478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,32,power_law_1.2,0.05644800066947937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,4,balanced,0.05766933163007101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,4,balanced,0.05816000203291575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,4,power_law_1.01,0.10377600193023681
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,4,power_law_1.01,0.10586240291595458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,4,power_law_1.2,0.0870848000049591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,4,power_law_1.2,0.09964159727096558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,64,balanced,0.029290666182835896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,64,balanced,0.029493334392706554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,64,power_law_1.01,0.03590399920940399
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,64,power_law_1.01,0.03632639944553375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,64,power_law_1.2,0.0353983998298645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,64,power_law_1.2,0.03672960102558136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,8,balanced,0.03782933453718821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,8,balanced,0.039706667264302574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,8,power_law_1.01,0.09165440201759338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,8,power_law_1.01,0.09462400078773499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,8,power_law_1.2,0.0855679988861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,1,8,power_law_1.2,0.09080320000648498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,16,1,balanced,0.0335413341720899
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,16,1,balanced,0.035936000446478523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,16,1,power_law_1.01,0.03283840119838714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,16,1,power_law_1.01,0.03527039885520935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,16,1,power_law_1.2,0.03415679931640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,16,1,power_law_1.2,0.035078400373458864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,2,1,balanced,0.08448533217112224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,2,1,balanced,0.08687466382980347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,2,1,power_law_1.01,0.08376320004463196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,2,1,power_law_1.01,0.08509439826011658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,2,1,power_law_1.2,0.08364800214767457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,2,1,power_law_1.2,0.08442879915237426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,32,1,balanced,0.03370666752258936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,32,1,balanced,0.034517332911491394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,32,1,power_law_1.01,0.03216640055179596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,32,1,power_law_1.01,0.033913600444793704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,32,1,power_law_1.2,0.03170560002326965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,32,1,power_law_1.2,0.03251200020313263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,4,1,balanced,0.059248000383377075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,4,1,balanced,0.059978668888409935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,4,1,power_law_1.01,0.057555198669433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,4,1,power_law_1.01,0.05845119953155518
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,4,1,power_law_1.2,0.056806397438049314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,4,1,power_law_1.2,0.05802879929542541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,8,1,balanced,0.03991466760635376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,8,1,balanced,0.04165866722663244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,8,1,power_law_1.01,0.04108160138130188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,8,1,power_law_1.01,0.041382399201393125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,8,1,power_law_1.2,0.04059520065784454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,256,8,1,power_law_1.2,0.04097279906272888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,1,balanced,0.13903466860453287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,1,balanced,0.14034133156140646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,1,power_law_1.01,0.13838080167770386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,1,power_law_1.01,0.13939839601516724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,1,power_law_1.2,0.13770240545272827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,1,power_law_1.2,0.13850239515304566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,128,balanced,0.029157333076000214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,128,balanced,0.029525332152843475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,128,power_law_1.01,0.029209598898887634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,128,power_law_1.01,0.029337599873542786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,128,power_law_1.2,0.030048000812530517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,128,power_law_1.2,0.03056640028953552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,16,balanced,0.02956266701221466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,16,balanced,0.03147733211517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,16,power_law_1.01,0.10900479555130005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,16,power_law_1.01,0.11193599700927734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,16,power_law_1.2,0.09751039743423462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,16,power_law_1.2,0.10337920188903808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,2,balanced,0.08546666304270427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,2,balanced,0.08681066830952962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,2,power_law_1.01,0.1373695969581604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,2,power_law_1.01,0.1375040054321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,2,power_law_1.2,0.11989120244979859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,2,power_law_1.2,0.125491201877594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,32,balanced,0.029552000264326733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,32,balanced,0.031002665559450786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,32,power_law_1.01,0.06922879815101624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,32,power_law_1.01,0.0711359977722168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,32,power_law_1.2,0.06824319958686828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,32,power_law_1.2,0.07027199864387512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,4,balanced,0.05625600119431814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,4,balanced,0.05788266658782959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,4,power_law_1.01,0.13738880157470704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,4,power_law_1.01,0.13772799968719482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,4,power_law_1.2,0.1087615966796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,4,power_law_1.2,0.11498880386352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,64,balanced,0.029557332396507263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,64,balanced,0.030234667162100475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,64,power_law_1.01,0.05062400102615357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,64,power_law_1.01,0.051648002862930295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,64,power_law_1.2,0.05025920271873474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,64,power_law_1.2,0.05085440278053284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,8,balanced,0.03753600021203359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,8,balanced,0.039813332259655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,8,power_law_1.01,0.13827199935913087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,8,power_law_1.01,0.1384703993797302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,8,power_law_1.2,0.1087231993675232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,1,8,power_law_1.2,0.11102720499038696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,16,1,balanced,0.03405333310365677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,16,1,balanced,0.03485333422819773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,16,1,power_law_1.01,0.032076799869537355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,16,1,power_law_1.01,0.032671999931335446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,16,1,power_law_1.2,0.0344895988702774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,16,1,power_law_1.2,0.03454079926013946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,2,1,balanced,0.08635733524958293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,2,1,balanced,0.08681066830952962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,2,1,power_law_1.01,0.08309760093688964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,2,1,power_law_1.01,0.08457599878311158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,2,1,power_law_1.2,0.08478080034255982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,2,1,power_law_1.2,0.08541439771652222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,32,1,balanced,0.03356799980004629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,32,1,balanced,0.03571200122435888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,32,1,power_law_1.01,0.03160319924354553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,32,1,power_law_1.01,0.03200640082359314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,32,1,power_law_1.2,0.031564798951148984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,32,1,power_law_1.2,0.03166080117225647
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,4,1,balanced,0.05811200042565664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,4,1,balanced,0.05843733251094818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,4,1,power_law_1.01,0.05603839755058289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,4,1,power_law_1.01,0.05737599730491638
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,4,1,power_law_1.2,0.056729602813720706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,4,1,power_law_1.2,0.058233600854873654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,8,1,balanced,0.03944533318281174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,8,1,balanced,0.03984000037113825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,8,1,power_law_1.01,0.039027199149131775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,8,1,power_law_1.01,0.04030719995498657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,8,1,power_law_1.2,0.040934398770332336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4,7168,2048,8,384,8,1,power_law_1.2,0.041440001130104064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,1,balanced,0.24219733476638794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,1,balanced,0.24813334147135416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,1,power_law_1.01,0.283187198638916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,1,power_law_1.01,0.29205760955810545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,1,power_law_1.2,0.2880511999130249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,1,power_law_1.2,0.2928639888763428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,128,balanced,0.0664106657107671
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,128,balanced,0.06643199920654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,128,power_law_1.01,0.07144320011138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,128,power_law_1.01,0.07149440050125122
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,128,power_law_1.2,0.07788159847259521
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,128,power_law_1.2,0.08090879917144775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,16,balanced,0.07539199789365132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,16,balanced,0.07866133252779643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,16,power_law_1.01,0.09237120151519776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,16,power_law_1.01,0.09278079867362976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,16,power_law_1.2,0.09472640156745911
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,16,power_law_1.2,0.1000704050064087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,2,balanced,0.15478400389353433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,2,balanced,0.15588800112406412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,2,power_law_1.01,0.18675199747085572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,2,power_law_1.01,0.19104000329971313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,2,power_law_1.2,0.19073280096054077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,2,power_law_1.2,0.1922816038131714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,32,balanced,0.06865066786607106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,32,balanced,0.07192533214886983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,32,power_law_1.01,0.08060160279273987
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,32,power_law_1.01,0.08364160060882568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,32,power_law_1.2,0.08999040126800537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,32,power_law_1.2,0.09315199851989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,4,balanced,0.11518399914105733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,4,balanced,0.1159946620464325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,4,power_law_1.01,0.1328384041786194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,4,power_law_1.01,0.13941119909286498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,4,power_law_1.2,0.1341375946998596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,4,power_law_1.2,0.1404096007347107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,64,balanced,0.0666133314371109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,64,balanced,0.06880533198515575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,64,power_law_1.01,0.07530239820480347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,64,power_law_1.01,0.07580800056457519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,64,power_law_1.2,0.084934401512146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,64,power_law_1.2,0.08683519959449768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,8,balanced,0.09091200431187947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,8,balanced,0.09108799695968628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,8,power_law_1.01,0.10901119709014892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,8,power_law_1.01,0.11043839454650879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,8,power_law_1.2,0.11202559471130372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,1,8,power_law_1.2,0.11670399904251098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,2,1,balanced,0.18717332681020102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,2,1,balanced,0.18897066513697305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,2,1,power_law_1.01,0.2083967924118042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,2,1,power_law_1.01,0.2092223882675171
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,2,1,power_law_1.2,0.21062400341033935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,2,1,power_law_1.2,0.21252479553222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,4,1,balanced,0.1593280037244161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,4,1,balanced,0.16192533572514853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,4,1,power_law_1.01,0.17570559978485106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,4,1,power_law_1.01,0.17872639894485473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,4,1,power_law_1.2,0.17910399436950683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,2048,768,8,128,4,1,power_law_1.2,0.1797376036643982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,1,balanced,0.5403840144475301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,1,balanced,0.5441386699676514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,1,power_law_1.01,0.6484352111816406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,1,power_law_1.01,0.6513343811035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,1,power_law_1.2,0.6709440231323243
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,1,power_law_1.2,0.6754879951477051
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,128,balanced,0.08319999774297078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,128,balanced,0.08659733335177104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,128,power_law_1.01,0.09832320213317872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,128,power_law_1.01,0.10011520385742187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,128,power_law_1.2,0.10097919702529908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,128,power_law_1.2,0.10540800094604492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,16,balanced,0.11699733138084412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,16,balanced,0.11762133240699768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,16,power_law_1.01,0.13890559673309327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,16,power_law_1.01,0.14382719993591309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,16,power_law_1.2,0.15175679922103882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,16,power_law_1.2,0.15308159589767456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,2,balanced,0.2781493266423543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,2,balanced,0.27873067061106366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,2,power_law_1.01,0.384115195274353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,2,power_law_1.01,0.39260799884796144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,2,power_law_1.2,0.40508160591125486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,2,power_law_1.2,0.4300992012023926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,256,balanced,0.08223466575145721
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,256,balanced,0.08267199993133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,256,power_law_1.01,0.09075199961662292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,256,power_law_1.01,0.09093760251998902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,256,power_law_1.2,0.10056320428848267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,256,power_law_1.2,0.10198400020599366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,32,balanced,0.10307199756304423
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,32,balanced,0.10326400399208069
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,32,power_law_1.01,0.11740800142288207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,32,power_law_1.01,0.12132480144500732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,32,power_law_1.2,0.12499200105667115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,32,power_law_1.2,0.128601598739624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,4,balanced,0.18598399559656778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,4,balanced,0.18622400363286337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,4,power_law_1.01,0.2414720058441162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,4,power_law_1.01,0.2444159984588623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,4,power_law_1.2,0.2693120002746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,4,power_law_1.2,0.2751296043395996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,64,balanced,0.08950933814048767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,64,balanced,0.09308266639709473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,64,power_law_1.01,0.10828160047531128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,64,power_law_1.01,0.11090559959411621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,64,power_law_1.2,0.11726080179214478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,64,power_law_1.2,0.12123520374298095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,8,balanced,0.14257599910100302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,8,balanced,0.14274133245150247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,8,power_law_1.01,0.17614079713821412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,8,power_law_1.01,0.17727359533309936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,8,power_law_1.2,0.1807360053062439
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,1,8,power_law_1.2,0.18121600151062012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,2,1,balanced,0.36265599727630615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,2,1,balanced,0.37697064876556396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,2,1,power_law_1.01,0.4184703826904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,2,1,power_law_1.01,0.4185664176940918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,2,1,power_law_1.2,0.43205761909484863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,2,1,power_law_1.2,0.4333695888519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,4,1,balanced,0.25061333179473877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,4,1,balanced,0.25067732731501263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,4,1,power_law_1.01,0.2775615930557251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,4,1,power_law_1.01,0.27915520668029786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,4,1,power_law_1.2,0.2847424030303955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,4,1,power_law_1.2,0.28638079166412356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,8,1,balanced,0.23834667603174844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,8,1,balanced,0.23944532871246338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,8,1,power_law_1.01,0.27130880355834963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,8,1,power_law_1.01,0.28063359260559084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,8,1,power_law_1.2,0.27125120162963867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,3072,1536,8,256,8,1,power_law_1.2,0.2852799892425537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,1,balanced,0.8598986466725668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,1,balanced,0.864245335261027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,1,power_law_1.01,0.9253120422363281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,1,power_law_1.01,0.9418623924255372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,1,power_law_1.2,0.9269760131835938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,1,power_law_1.2,0.9658687591552735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,2,balanced,0.472053329149882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,2,balanced,0.4761333465576172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,2,power_law_1.01,0.6467904090881348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,2,power_law_1.01,0.6594048023223877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,2,power_law_1.2,0.66495361328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,2,power_law_1.2,0.6892288208007813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,4,balanced,0.2925279935201009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,4,balanced,0.2943999965985616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,4,power_law_1.01,0.5037631988525391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,4,power_law_1.01,0.5085375785827637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,4,power_law_1.2,0.49485440254211427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,4,power_law_1.2,0.5609216213226318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,8,balanced,0.19724800189336142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,8,balanced,0.19776000579198202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,8,power_law_1.01,0.4304448127746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,8,power_law_1.01,0.4439680099487305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,8,power_law_1.2,0.4476480007171631
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,1,8,power_law_1.2,0.4566976070404053
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,16,1,balanced,0.1580586632092794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,16,1,balanced,0.15862933794657388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,16,1,power_law_1.01,0.16100480556488037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,16,1,power_law_1.01,0.16104960441589355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,16,1,power_law_1.2,0.15998079776763915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,16,1,power_law_1.2,0.16101759672164917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,2,1,balanced,0.4734666744867961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,2,1,balanced,0.4745546579360962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,2,1,power_law_1.01,0.5153984069824219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,2,1,power_law_1.01,0.5341440200805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,2,1,power_law_1.2,0.5049344062805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,2,1,power_law_1.2,0.5453824043273926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,32,1,balanced,0.13873066504796347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,32,1,balanced,0.13961600263913473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,32,1,power_law_1.01,0.1373311996459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,32,1,power_law_1.01,0.13864959478378297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,32,1,power_law_1.2,0.13761279582977295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,32,1,power_law_1.2,0.1382464051246643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,4,1,balanced,0.2937013308207194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,4,1,balanced,0.2947946588198344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,4,1,power_law_1.01,0.30820479393005373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,4,1,power_law_1.01,0.3120575904846191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,4,1,power_law_1.2,0.3016063928604126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,4,1,power_law_1.2,0.31166079044342043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,8,1,balanced,0.20455465714136759
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,8,1,balanced,0.2056480050086975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,8,1,power_law_1.01,0.20765440464019774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,8,1,power_law_1.01,0.20904319286346434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,8,1,power_law_1.2,0.21147520542144777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,14336,2,8,8,1,power_law_1.2,0.21833600997924804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,1,balanced,0.5173333485921224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,1,balanced,0.5188906590143839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,1,power_law_1.01,0.6271872043609619
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,1,power_law_1.01,0.6303808212280273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,1,power_law_1.2,0.6340991973876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,1,power_law_1.2,0.645747184753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,128,balanced,0.10609599947929382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,128,balanced,0.10661866267522176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,128,power_law_1.01,0.12319359779357911
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,128,power_law_1.01,0.12702080011367797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,128,power_law_1.2,0.14084479808807374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,128,power_law_1.2,0.14264960289001466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,16,balanced,0.12985600034395853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,16,balanced,0.12990400195121765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,16,power_law_1.01,0.15797120332717896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,16,power_law_1.01,0.16473599672317504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,16,power_law_1.2,0.17226239442825317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,16,power_law_1.2,0.17547520399093627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,2,balanced,0.2988266746203105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,2,balanced,0.2999093333880107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,2,power_law_1.01,0.38613119125366213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,2,power_law_1.01,0.3941823959350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,2,power_law_1.2,0.3975872039794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,2,power_law_1.2,0.4053631782531738
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,32,balanced,0.11691199739774068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,32,balanced,0.11755733688672383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,32,power_law_1.01,0.14060159921646118
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,32,power_law_1.01,0.1455296039581299
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,32,power_law_1.2,0.15362559556961058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,32,power_law_1.2,0.15614720582962036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,4,balanced,0.20193066199620566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,4,balanced,0.203167994817098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,4,power_law_1.01,0.2582848072052002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,4,power_law_1.01,0.2609407901763916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,4,power_law_1.2,0.264736008644104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,4,power_law_1.2,0.2784895896911621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,64,balanced,0.10911466677983601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,64,balanced,0.11088533202807109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,64,power_law_1.01,0.13097599744796753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,64,power_law_1.01,0.13593599796295167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,64,power_law_1.2,0.145632004737854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,64,power_law_1.2,0.14639359712600708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,8,balanced,0.15606932838757834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,8,balanced,0.15678399801254272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,8,power_law_1.01,0.188646399974823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,8,power_law_1.01,0.19228800535202026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,8,power_law_1.2,0.21240320205688476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,1,8,power_law_1.2,0.21477119922637938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,2,1,balanced,0.3447786569595337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,2,1,balanced,0.3460426727930705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,2,1,power_law_1.01,0.3986112117767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,2,1,power_law_1.01,0.40334720611572267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,2,1,power_law_1.2,0.40619521141052245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,2,1,power_law_1.2,0.40944638252258303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,4,1,balanced,0.273306667804718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,4,1,balanced,0.2752693295478821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,4,1,power_law_1.01,0.3065792083740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,4,1,power_law_1.01,0.30753920078277586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,4,1,power_law_1.2,0.3142656087875366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,4,1,power_law_1.2,0.3175935983657837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,8,1,balanced,0.24417599042256674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,8,1,balanced,0.24558399120966592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,8,1,power_law_1.01,0.27175040245056153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,8,1,power_law_1.01,0.2953088045120239
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,8,1,power_law_1.2,0.2717184066772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,4096,1536,8,128,8,1,power_law_1.2,0.29925758838653566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,1,balanced,1.6600213050842285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,1,balanced,1.6739840507507324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,1,power_law_1.01,1.792633628845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,1,power_law_1.01,1.8353151321411132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,1,power_law_1.2,1.7922687530517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,1,power_law_1.2,1.8044479370117188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,2,balanced,0.8710292975107828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,2,balanced,0.8735146522521973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,2,power_law_1.01,1.0897151947021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,2,power_law_1.01,1.356608009338379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,2,power_law_1.2,1.2559103965759277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,2,power_law_1.2,1.3655360221862793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,4,balanced,0.48046398162841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,4,balanced,0.4839093287785848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,4,power_law_1.01,0.862342357635498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,4,power_law_1.01,0.9280896186828613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,4,power_law_1.2,0.9122495651245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,4,power_law_1.2,0.9479680061340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,8,balanced,0.29335467020670575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,8,balanced,0.29640533526738483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,8,power_law_1.01,0.8077247619628907
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,8,power_law_1.01,0.8212032318115234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,8,power_law_1.2,0.8051327705383301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,1,8,power_law_1.2,0.848755168914795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,16,1,balanced,0.2223680019378662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,16,1,balanced,0.22334933280944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,16,1,power_law_1.01,0.2304896116256714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,16,1,power_law_1.01,0.2357952117919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,16,1,power_law_1.2,0.22933120727539064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,16,1,power_law_1.2,0.23496320247650146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,2,1,balanced,0.750378688176473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,2,1,balanced,0.7537226676940918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,2,1,power_law_1.01,0.8027008056640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,2,1,power_law_1.01,0.8222399711608886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,2,1,power_law_1.2,0.7927487850189209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,2,1,power_law_1.2,0.8006591796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,32,1,balanced,0.18953599532445273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,32,1,balanced,0.1909493406613668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,32,1,power_law_1.01,0.19191039800643922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,32,1,power_law_1.01,0.1923840045928955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,32,1,power_law_1.2,0.1912384033203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,32,1,power_law_1.2,0.191539204120636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,4,1,balanced,0.4468640089035034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,4,1,balanced,0.4482986529668172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,4,1,power_law_1.01,0.48165121078491213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,4,1,power_law_1.01,0.485152006149292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,4,1,power_law_1.2,0.47927041053771974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,4,1,power_law_1.2,0.482374382019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,8,1,balanced,0.30027200778325397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,8,1,balanced,0.30107732613881427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,8,1,power_law_1.01,0.30801920890808104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,8,1,power_law_1.01,0.32245759963989257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,8,1,power_law_1.2,0.31480319499969484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,16384,2,8,8,1,power_law_1.2,0.31505279541015624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,1,balanced,1.3574879964192708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,1,balanced,1.3603307406107585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,1,power_law_1.01,1.614182472229004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,1,power_law_1.01,1.6343040466308594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,1,power_law_1.2,1.6538688659667968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,1,power_law_1.2,1.6729728698730468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,128,balanced,0.14852799971898398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,128,balanced,0.14909332990646362
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,128,power_law_1.01,0.16705280542373657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,128,power_law_1.01,0.17076480388641357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,128,power_law_1.2,0.1831104040145874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,128,power_law_1.2,0.18561919927597045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,16,balanced,0.2013333241144816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,16,balanced,0.20175999402999878
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,16,power_law_1.01,0.24588160514831542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,16,power_law_1.01,0.2467967987060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,16,power_law_1.2,0.26788480281829835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,16,power_law_1.2,0.27936639785766604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,2,balanced,0.6079786618550619
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,2,balanced,0.6081813176472982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,2,power_law_1.01,0.8375167846679688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,2,power_law_1.01,0.861574363708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,2,power_law_1.2,0.8817855834960937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,2,power_law_1.2,0.8980863571166993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,256,balanced,0.14732266465822855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,256,balanced,0.1476693352063497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,256,power_law_1.01,0.15754879713058473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,256,power_law_1.01,0.15882879495620728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,256,power_law_1.2,0.17582080364227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,256,power_law_1.2,0.17955199480056763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,32,balanced,0.17303999265034994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,32,balanced,0.17324799299240112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,32,power_law_1.01,0.2142848014831543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,32,power_law_1.01,0.21709439754486085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,32,power_law_1.2,0.22294399738311768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,32,power_law_1.2,0.23243520259857178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,4,balanced,0.370410680770874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,4,balanced,0.3712533315022786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,4,power_law_1.01,0.4853695869445801
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,4,power_law_1.01,0.5155136108398437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,4,power_law_1.2,0.5640192031860352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,4,power_law_1.2,0.5839231967926025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,64,balanced,0.15665599703788757
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,64,balanced,0.1581546664237976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,64,power_law_1.01,0.18156800270080567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,64,power_law_1.01,0.1941375970840454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,64,power_law_1.2,0.19511040449142455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,64,power_law_1.2,0.2034559965133667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,8,balanced,0.2579360008239746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,8,balanced,0.25836799542109173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,8,power_law_1.01,0.3312191963195801
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,8,power_law_1.01,0.3368704080581665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,8,power_law_1.2,0.36323840618133546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,1,8,power_law_1.2,0.3737792015075684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,16,1,balanced,0.3802186648050944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,16,1,balanced,0.38045867284138996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,16,1,power_law_1.01,0.4185919761657715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,16,1,power_law_1.01,0.4707071781158447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,16,1,power_law_1.2,0.4186367988586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,16,1,power_law_1.2,0.48214402198791506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,2,1,balanced,0.7869439919789633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,2,1,balanced,0.7884213129679362
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,2,1,power_law_1.01,0.9171775817871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,2,1,power_law_1.01,0.9188096046447753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,2,1,power_law_1.2,0.9424320220947265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,2,1,power_law_1.2,0.9464575767517089
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,32,1,balanced,0.3930613199869792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,32,1,balanced,0.42395198345184326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,32,1,power_law_1.01,0.4369472026824951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,32,1,power_law_1.01,0.4981247901916504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,32,1,power_law_1.2,0.44440321922302245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,32,1,power_law_1.2,0.4481664180755615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,4,1,balanced,0.5128426551818848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,4,1,balanced,0.5131093263626099
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,4,1,power_law_1.01,0.571398401260376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,4,1,power_law_1.01,0.5731071949005127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,4,1,power_law_1.2,0.5850880146026611
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,4,1,power_law_1.2,0.5857471942901611
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,8,1,balanced,0.41473066806793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,8,1,balanced,0.4633013407389323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,8,1,power_law_1.01,0.4584191799163818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,8,1,power_law_1.01,0.45932798385620116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,8,1,power_law_1.2,0.4639167785644531
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2048,8,256,8,1,power_law_1.2,0.46450557708740237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,1,balanced,1.9626773198445637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,1,balanced,1.9638080596923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,1,power_law_1.01,1.490227222442627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,1,power_law_1.01,1.5294591903686523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,1,power_law_1.2,1.5387328147888184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,1,power_law_1.2,1.5590335845947265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,16,balanced,0.2113973299662272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,16,balanced,0.21141332387924194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,16,power_law_1.01,0.279257607460022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,16,power_law_1.01,0.28545920848846434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,16,power_law_1.2,0.29796481132507324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,16,power_law_1.2,0.30259199142456056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,2,balanced,0.8163039684295654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,2,balanced,0.8172266483306885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,2,power_law_1.01,0.8568256378173829
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,2,power_law_1.01,0.8605631828308106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,2,power_law_1.2,0.9476863861083984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,2,power_law_1.2,0.9650752067565918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,32,balanced,0.1751520037651062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,32,balanced,0.1759893298149109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,32,power_law_1.01,0.22641279697418212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,32,power_law_1.01,0.22688000202178954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,32,power_law_1.2,0.26058239936828614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,32,power_law_1.2,0.2756416082382202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,4,balanced,0.4113440116246541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,4,balanced,0.41311999162038165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,4,power_law_1.01,0.5126719951629639
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,4,power_law_1.01,0.5421823978424072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,4,power_law_1.2,0.6071231842041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,4,power_law_1.2,0.6232128143310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,8,balanced,0.2749333381652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,8,balanced,0.2751893401145935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,8,power_law_1.01,0.3534976005554199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,8,power_law_1.01,0.3655936002731323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,8,power_law_1.2,0.37056000232696534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,1,8,power_law_1.2,0.40254721641540525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,2,1,balanced,1.097872018814087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,2,1,balanced,1.1169333457946777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,2,1,power_law_1.01,0.8660672187805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,2,1,power_law_1.01,0.8679424285888672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,2,1,power_law_1.2,0.884716796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,2,1,power_law_1.2,0.8909248352050781
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,4,1,balanced,0.6802720228830973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,4,1,balanced,0.6813440322875977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,4,1,power_law_1.01,0.5562431812286377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,4,1,power_law_1.01,0.5576128005981446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,4,1,power_law_1.2,0.5702079772949219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,4,1,power_law_1.2,0.5756415843963623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,8,1,balanced,0.5129439830780029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,8,1,balanced,0.5138880014419556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,8,1,power_law_1.01,0.439635181427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,8,1,power_law_1.01,0.448576021194458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,8,1,power_law_1.2,0.45285758972167967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,6144,2560,8,160,8,1,power_law_1.2,0.45559039115905764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,1,balanced,1.5602347056070964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,1,balanced,1.5983840624491374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,1,power_law_1.01,1.8880512237548828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,1,power_law_1.01,1.8926719665527343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,1,power_law_1.2,1.9525632858276367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,1,power_law_1.2,1.964543914794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,128,balanced,0.1687999963760376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,128,balanced,0.16943466663360596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,128,power_law_1.01,0.19302400350570678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,128,power_law_1.01,0.1963520050048828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,128,power_law_1.2,0.20911359786987305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,128,power_law_1.2,0.21581439971923827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,16,balanced,0.22950933376948038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,16,balanced,0.2300586700439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,16,power_law_1.01,0.27696640491485597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,16,power_law_1.01,0.2807424068450928
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,16,power_law_1.2,0.30373759269714357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,16,power_law_1.2,0.3144320011138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,2,balanced,0.7046026388804117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,2,balanced,0.7068479855855306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,2,power_law_1.01,0.9641152381896972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,2,power_law_1.01,0.9683199882507324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,2,power_law_1.2,0.9997376441955567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,2,power_law_1.2,1.0302335739135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,256,balanced,0.16632533073425293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,256,balanced,0.16673600673675537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,256,power_law_1.01,0.1801151990890503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,256,power_law_1.01,0.18044159412384034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,256,power_law_1.2,0.19998079538345337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,256,power_law_1.2,0.20647039413452148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,32,balanced,0.19571733474731445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,32,balanced,0.1963626742362976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,32,power_law_1.01,0.24264960289001464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,32,power_law_1.01,0.2465343952178955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,32,power_law_1.2,0.25499520301818845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,32,power_law_1.2,0.2635456085205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,4,balanced,0.42818665504455566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,4,balanced,0.4285759925842285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,4,power_law_1.01,0.5560639858245849
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,4,power_law_1.01,0.5783552169799805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,4,power_law_1.2,0.5989759922027588
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,4,power_law_1.2,0.606879997253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,64,balanced,0.17877866824467978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,64,balanced,0.1805866758028666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,64,power_law_1.01,0.2074431896209717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,64,power_law_1.01,0.21056001186370848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,64,power_law_1.2,0.2273087978363037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,64,power_law_1.2,0.22773759365081786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,8,balanced,0.29499200979868573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,8,balanced,0.29532267649968463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,8,power_law_1.01,0.3765887975692749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,8,power_law_1.01,0.39098238945007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,8,power_law_1.2,0.4079296112060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,1,8,power_law_1.2,0.40928001403808595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,16,1,balanced,0.43678398927052814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,16,1,balanced,0.4373493194580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,16,1,power_law_1.01,0.47930240631103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,16,1,power_law_1.01,0.48047361373901365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,16,1,power_law_1.2,0.48271999359130857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,16,1,power_law_1.2,0.48659839630126955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,2,1,balanced,0.9114720026652018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,2,1,balanced,0.9137600262959799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,2,1,power_law_1.01,1.0667903900146485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,2,1,power_law_1.01,1.0804800033569335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,2,1,power_law_1.2,1.0929599761962892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,2,1,power_law_1.2,1.0952704429626465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,32,1,balanced,0.44922133286794025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,32,1,balanced,0.45005865891774494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,32,1,power_law_1.01,0.5048960208892822
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,32,1,power_law_1.01,0.574015998840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,32,1,power_law_1.2,0.5163392066955567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,32,1,power_law_1.2,0.5498752117156982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,4,1,balanced,0.5912053187688192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,4,1,balanced,0.5925173362096151
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,4,1,power_law_1.01,0.6611135959625244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,4,1,power_law_1.01,0.6681215763092041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,4,1,power_law_1.2,0.6809599876403809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,4,1,power_law_1.2,0.683519983291626
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,8,1,balanced,0.4776906569798787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,8,1,balanced,0.4808586835861206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,8,1,power_law_1.01,0.5273151874542237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,8,1,power_law_1.01,0.5948544025421143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,8,1,power_law_1.2,0.5365183830261231
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,256,8,1,power_law_1.2,0.5392576217651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,1,balanced,2.930805206298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,1,balanced,3.1604159673055015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,1,power_law_1.01,2.1536319732666014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,1,power_law_1.01,2.2104703903198244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,1,power_law_1.2,2.3176639556884764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,1,power_law_1.2,2.3290048599243165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,128,balanced,0.17087999979654947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,128,balanced,0.1748639941215515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,128,power_law_1.01,0.19041919708251953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,128,power_law_1.01,0.1938431978225708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,128,power_law_1.2,0.20632319450378417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,128,power_law_1.2,0.20638079643249513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,16,balanced,0.26339733600616455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,16,balanced,0.2635093331336975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,16,power_law_1.01,0.2979007959365845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,16,power_law_1.01,0.30850560665130616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,16,power_law_1.2,0.3126015901565552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,16,power_law_1.2,0.327839994430542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,2,balanced,1.2596746285756428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,2,balanced,1.2653760115305583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,2,power_law_1.01,1.170751953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,2,power_law_1.01,1.2203968048095704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,2,power_law_1.2,1.2743616104125977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,2,power_law_1.2,1.2919743537902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,32,balanced,0.21125332514444986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,32,balanced,0.2127466599146525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,32,power_law_1.01,0.2388223886489868
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,32,power_law_1.01,0.24096639156341554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,32,power_law_1.2,0.2542527914047241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,32,power_law_1.2,0.2599168062210083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,4,balanced,0.5478773514429728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,4,balanced,0.5480159918467203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,4,power_law_1.01,0.6476352214813232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,4,power_law_1.01,0.6876671791076661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,4,power_law_1.2,0.7262144088745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,4,power_law_1.2,0.7539904117584229
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,64,balanced,0.18890666961669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,64,balanced,0.18946133057276407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,64,power_law_1.01,0.20968959331512452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,64,power_law_1.01,0.21077120304107666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,64,power_law_1.2,0.22519679069519044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,64,power_law_1.2,0.22992000579833985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,8,balanced,0.35734931627909344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,8,balanced,0.35788265864054364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,8,power_law_1.01,0.4289408206939697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,8,power_law_1.01,0.4332479953765869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,8,power_law_1.2,0.4667327880859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,1,8,power_law_1.2,0.48659839630126955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,16,1,balanced,0.5419626633326212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,16,1,balanced,0.5433973471323649
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,16,1,power_law_1.01,0.512883186340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,16,1,power_law_1.01,0.5500288009643555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,16,1,power_law_1.2,0.5232192039489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,16,1,power_law_1.2,0.6015679836273193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,2,1,balanced,1.3957707087198894
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,2,1,balanced,1.503328005472819
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,2,1,power_law_1.01,1.2204928398132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,2,1,power_law_1.01,1.2347455978393556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,2,1,power_law_1.2,1.262515163421631
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,2,1,power_law_1.2,1.2963135719299317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,32,1,balanced,0.5386506716410319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,32,1,balanced,0.53984534740448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,32,1,power_law_1.01,0.539795207977295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,32,1,power_law_1.01,0.5429952144622803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,32,1,power_law_1.2,0.5455679893493652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,32,1,power_law_1.2,0.5572927951812744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,4,1,balanced,0.8336586952209473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,4,1,balanced,0.8341173330942789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,4,1,power_law_1.01,0.7411903858184814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,4,1,power_law_1.01,0.7442495822906494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,4,1,power_law_1.2,0.7732096195220948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,4,1,power_law_1.2,0.7776832103729248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,8,1,balanced,0.6294026772181193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,8,1,balanced,0.6300319830576578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,8,1,power_law_1.01,0.5724991798400879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,8,1,power_law_1.01,0.6455935955047607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,8,1,power_law_1.2,0.5907839775085449
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,4096,7168,2048,8,384,8,1,power_law_1.2,0.5914815902709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,1,balanced,0.08264533181985219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,1,balanced,0.08270399769147237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,1,power_law_1.01,0.0745024025440216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,1,power_law_1.01,0.07580159902572632
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,1,power_law_1.2,0.07363839745521546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,1,power_law_1.2,0.07371519804000855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,128,balanced,0.03366400053103765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,128,balanced,0.03538133452335993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,128,power_law_1.01,0.032467201352119446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,128,power_law_1.01,0.0333759993314743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,128,power_law_1.2,0.03196159899234772
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,128,power_law_1.2,0.03288959860801697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,16,balanced,0.03154666721820831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,16,balanced,0.031557333966096245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,16,power_law_1.01,0.029772800207138062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,16,power_law_1.01,0.029862400889396668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,16,power_law_1.2,0.03017599880695343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,16,power_law_1.2,0.030579200387001036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,2,balanced,0.057760000228881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,2,balanced,0.0583840012550354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,2,power_law_1.01,0.05321599841117859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,2,power_law_1.01,0.05421440005302429
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,2,power_law_1.2,0.053855997323989865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,2,power_law_1.2,0.05444480180740356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,32,balanced,0.02943466603755951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,32,balanced,0.03133333226044973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,32,power_law_1.01,0.02839039862155914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,32,power_law_1.01,0.029183998703956604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,32,power_law_1.2,0.027289599180221558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,32,power_law_1.2,0.02839680016040802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,4,balanced,0.03685333331425985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,4,balanced,0.03793066740036011
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,4,power_law_1.01,0.03591040074825287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,4,power_law_1.01,0.03726080060005188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,4,power_law_1.2,0.036582401394844054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,4,power_law_1.2,0.037574398517608645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,64,balanced,0.033626665671666466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,64,balanced,0.0356480007370313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,64,power_law_1.01,0.0328000009059906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,64,power_law_1.01,0.03416320085525513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,64,power_law_1.2,0.03266560137271881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,64,power_law_1.2,0.033055999875068666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,8,balanced,0.03160533308982849
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,8,balanced,0.032261334359645844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,8,power_law_1.01,0.029760000109672547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,8,power_law_1.01,0.0304639995098114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,8,power_law_1.2,0.031353598833084105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,1,8,power_law_1.2,0.0318015992641449
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,2,1,balanced,0.0598880002895991
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,2,1,balanced,0.0602400004863739
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,2,1,power_law_1.01,0.054502397775650024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,2,1,power_law_1.01,0.05489919781684875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,2,1,power_law_1.2,0.05484799742698669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,2,1,power_law_1.2,0.05490559935569763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,4,1,balanced,0.04046933352947235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,4,1,balanced,0.04159999887148539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,4,1,power_law_1.01,0.03825919926166534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,4,1,power_law_1.01,0.03874559998512268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,4,1,power_law_1.2,0.03989759981632233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,2048,768,8,128,4,1,power_law_1.2,0.03994239866733551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,1,balanced,0.31035733222961426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,1,balanced,0.31169599294662476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,1,power_law_1.01,0.23177599906921387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,1,power_law_1.01,0.23210880756378174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,1,power_law_1.2,0.22670719623565674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,1,power_law_1.2,0.22731521129608154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,128,balanced,0.03766933331886927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,128,balanced,0.03941866755485535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,128,power_law_1.01,0.03686400055885315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,128,power_law_1.01,0.03751679956912994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,128,power_law_1.2,0.03646720051765442
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,128,power_law_1.2,0.03660799860954285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,16,balanced,0.049973333875338234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,16,balanced,0.05156800150871277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,16,power_law_1.01,0.04399999976158142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,16,power_law_1.01,0.0459199994802475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,16,power_law_1.2,0.04650880098342895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,16,power_law_1.2,0.04718720018863678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,2,balanced,0.17127466201782227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,2,balanced,0.17314666509628296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,2,power_law_1.01,0.1352959990501404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,2,power_law_1.01,0.1356735944747925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,2,power_law_1.2,0.1337280035018921
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,2,power_law_1.2,0.13393919467926024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,256,balanced,0.0377866675456365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,256,balanced,0.037791999677817024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,256,power_law_1.01,0.03436160087585449
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,256,power_law_1.01,0.03550080060958862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,256,power_law_1.2,0.03427839875221252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,256,power_law_1.2,0.03532800078392029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,32,balanced,0.03628266602754593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,32,balanced,0.0365280012289683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,32,power_law_1.01,0.03261440098285675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,32,power_law_1.01,0.03473919928073883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,32,power_law_1.2,0.0332863986492157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,32,power_law_1.2,0.03374719917774201
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,4,balanced,0.10312533378601074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,4,balanced,0.10357333223025005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,4,power_law_1.01,0.09127680063247681
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,4,power_law_1.01,0.09292799830436707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,4,power_law_1.2,0.08698239922523499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,4,power_law_1.2,0.09318400025367737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,64,balanced,0.033615998923778534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,64,balanced,0.033813332517941795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,64,power_law_1.01,0.031763198971748355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,64,power_law_1.01,0.03367680013179779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,64,power_law_1.2,0.03253119885921478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,64,power_law_1.2,0.032601600885391234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,8,balanced,0.06881066660086314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,8,balanced,0.06901866694291432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,8,power_law_1.01,0.061843198537826535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,8,power_law_1.01,0.062463998794555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,8,power_law_1.2,0.05615360140800476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,1,8,power_law_1.2,0.06056320071220398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,2,1,balanced,0.17628800868988037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,2,1,balanced,0.17680533727010092
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,2,1,power_law_1.01,0.1331264019012451
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,2,1,power_law_1.01,0.1340288043022156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,2,1,power_law_1.2,0.13200639486312865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,2,1,power_law_1.2,0.13322240114212036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,4,1,balanced,0.10955733060836792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,4,1,balanced,0.10963732997576396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,4,1,power_law_1.01,0.08492159843444824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,4,1,power_law_1.01,0.08848639726638793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,4,1,power_law_1.2,0.08398720026016235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,4,1,power_law_1.2,0.08548480272293091
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,8,1,balanced,0.08037866652011871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,8,1,balanced,0.08052800099054973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,8,1,power_law_1.01,0.06686080098152161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,8,1,power_law_1.01,0.06707839965820313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,8,1,power_law_1.2,0.0643775999546051
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,3072,1536,8,256,8,1,power_law_1.2,0.06598399877548218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,1,balanced,0.1753173271814982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,1,balanced,0.17537067333857217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,1,power_law_1.01,0.17615360021591187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,1,power_law_1.01,0.1786687970161438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,1,power_law_1.2,0.17562240362167358
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,1,power_law_1.2,0.17675520181655885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,2,balanced,0.0869653324286143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,2,balanced,0.0883893370628357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,2,power_law_1.01,0.09765120148658753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,2,power_law_1.01,0.0981760025024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,2,power_law_1.2,0.09466879963874816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,2,power_law_1.2,0.09750400185585022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,4,balanced,0.0646666685740153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,4,balanced,0.06596266726652782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,4,power_law_1.01,0.06335359811782837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,4,power_law_1.01,0.0651968002319336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,4,power_law_1.2,0.06530560255050659
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,4,power_law_1.2,0.06647040247917176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,8,balanced,0.056074668963750206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,8,balanced,0.056261335810025535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,8,power_law_1.01,0.053299200534820554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,8,power_law_1.01,0.05490559935569763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,8,power_law_1.2,0.05360640287399292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,1,8,power_law_1.2,0.05454720258712768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,16,1,balanced,0.033600000043710075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,16,1,balanced,0.03374933451414108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,16,1,power_law_1.01,0.031865599751472476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,16,1,power_law_1.01,0.033055999875068666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,16,1,power_law_1.2,0.031641599535942075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,16,1,power_law_1.2,0.032051199674606325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,2,1,balanced,0.09705600142478943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,2,1,balanced,0.09946133693059285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,2,1,power_law_1.01,0.09909120202064514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,2,1,power_law_1.01,0.09969919919967651
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,2,1,power_law_1.2,0.09975039958953857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,2,1,power_law_1.2,0.10039039850234985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,32,1,balanced,0.02951466788848241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,32,1,balanced,0.030613332986831665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,32,1,power_law_1.01,0.02805120050907135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,32,1,power_law_1.01,0.02890239953994751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,32,1,power_law_1.2,0.028460800647735596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,32,1,power_law_1.2,0.0290367990732193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,4,1,balanced,0.06503466765085857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,4,1,balanced,0.06638399759928386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,4,1,power_law_1.01,0.06340479850769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,4,1,power_law_1.01,0.0650816023349762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,4,1,power_law_1.2,0.06304640173912049
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,4,1,power_law_1.2,0.06310399770736694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,8,1,balanced,0.04754666487375895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,8,1,balanced,0.04791999856630961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,8,1,power_law_1.01,0.04517120122909546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,8,1,power_law_1.01,0.045388799905776975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,8,1,power_law_1.2,0.04519039988517761
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,14336,2,8,8,1,power_law_1.2,0.046035200357437134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,1,balanced,0.22162665923436484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,1,balanced,0.22267200549443564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,1,power_law_1.01,0.19915519952774047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,1,power_law_1.01,0.2011712074279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,1,power_law_1.2,0.19983999729156493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,1,power_law_1.2,0.1999616026878357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,128,balanced,0.03793599953254064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,128,balanced,0.03945599993069967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,128,power_law_1.01,0.03722879886627197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,128,power_law_1.01,0.03731839954853058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,128,power_law_1.2,0.03616639971733093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,128,power_law_1.2,0.037401598691940305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,16,balanced,0.037733333806196846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,16,balanced,0.0397173340121905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,16,power_law_1.01,0.0377023994922638
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,16,power_law_1.01,0.039155200123786926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,16,power_law_1.2,0.03891839981079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,16,power_law_1.2,0.039801600575447085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,2,balanced,0.12783466776212057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,2,balanced,0.1281066636244456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,2,power_law_1.01,0.11436799764633179
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,2,power_law_1.01,0.11461119651794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,2,power_law_1.2,0.11576319932937622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,2,power_law_1.2,0.11631360054016113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,32,balanced,0.03538133452335993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,32,balanced,0.03562666724125544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,32,power_law_1.01,0.033228799700737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,32,power_law_1.01,0.03338879942893982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,32,power_law_1.2,0.033011201024055484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,32,power_law_1.2,0.03330560028553009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,4,balanced,0.08079466720422109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,4,balanced,0.08136000235875447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,4,power_law_1.01,0.07409279942512512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,4,power_law_1.01,0.07589120268821717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,4,power_law_1.2,0.07363200187683105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,4,power_law_1.2,0.07657600045204163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,64,balanced,0.03972800076007843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,64,balanced,0.04152533411979675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,64,power_law_1.01,0.03768959939479828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,64,power_law_1.01,0.039103999733924866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,64,power_law_1.2,0.038899201154708865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,64,power_law_1.2,0.039526399970054624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,8,balanced,0.05824000140031179
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,8,balanced,0.059450666109720864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,8,power_law_1.01,0.053376001119613645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,8,power_law_1.01,0.05548160076141358
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,8,power_law_1.2,0.05485439896583557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,1,8,power_law_1.2,0.055769598484039305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,2,1,balanced,0.1299253304799398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,2,1,balanced,0.13129066427548727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,2,1,power_law_1.01,0.11759359836578369
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,2,1,power_law_1.01,0.11909760236740112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,2,1,power_law_1.2,0.11843839883804322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,2,1,power_law_1.2,0.11861120462417603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,4,1,balanced,0.08478933572769165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,4,1,balanced,0.08523733417193095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,4,1,power_law_1.01,0.0763647973537445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,4,1,power_law_1.01,0.07685760259628296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,4,1,power_law_1.2,0.07667199969291687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,4,1,power_law_1.2,0.07864320278167725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,8,1,balanced,0.06410666803518932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,8,1,balanced,0.0649599979321162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,8,1,power_law_1.01,0.060755199193954466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,8,1,power_law_1.01,0.06152960062026978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,8,1,power_law_1.2,0.06083199977874756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,4096,1536,8,128,8,1,power_law_1.2,0.06124160289764404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,1,balanced,0.354362686475118
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,1,balanced,0.35442666212717694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,1,power_law_1.01,0.33011839389801023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,1,power_law_1.01,0.33639039993286135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,1,power_law_1.2,0.34218881130218504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,1,power_law_1.2,0.34282240867614744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,2,balanced,0.1299626628557841
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,2,balanced,0.13083733121554056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,2,power_law_1.01,0.14780160188674926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,2,power_law_1.01,0.16252800226211547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,2,power_law_1.2,0.15681920051574708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,2,power_law_1.2,0.16357760429382323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,4,balanced,0.08288000027338664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,4,balanced,0.0846720039844513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,4,power_law_1.01,0.08554880023002624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,4,power_law_1.01,0.09007999897003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,4,power_law_1.2,0.08957440257072449
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,4,power_law_1.2,0.09352319836616516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,8,balanced,0.07069333394368489
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,8,balanced,0.07193066676457723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,8,power_law_1.01,0.06607360243797303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,8,power_law_1.01,0.06739839911460876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,8,power_law_1.2,0.06638079881668091
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,1,8,power_law_1.2,0.0679423987865448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,16,1,balanced,0.04309333364168803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,16,1,balanced,0.04340800146261851
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,16,1,power_law_1.01,0.04053759872913361
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,16,1,power_law_1.01,0.04079360067844391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,16,1,power_law_1.2,0.04025599956512451
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,16,1,power_law_1.2,0.04058879911899567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,2,1,balanced,0.1426346699396769
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,2,1,balanced,0.14492266376813254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,2,1,power_law_1.01,0.14832639694213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,2,1,power_law_1.01,0.1490496039390564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,2,1,power_law_1.2,0.15128320455551147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,2,1,power_law_1.2,0.15171200037002563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,32,1,balanced,0.03147733211517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,32,1,balanced,0.033626665671666466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,32,1,power_law_1.01,0.03123840093612671
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,32,1,power_law_1.01,0.03159680068492889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,32,1,power_law_1.2,0.030502399802207945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,32,1,power_law_1.2,0.030649599432945252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,4,1,balanced,0.08708799878756206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,4,1,balanced,0.08825600147247314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,4,1,power_law_1.01,0.08596479892730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,4,1,power_law_1.01,0.08996480107307434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,4,1,power_law_1.2,0.08776959776878357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,4,1,power_law_1.2,0.08823680281639099
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,8,1,balanced,0.05909333129723867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,8,1,balanced,0.060122668743133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,8,1,power_law_1.01,0.058534401655197146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,8,1,power_law_1.01,0.05869439840316772
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,8,1,power_law_1.2,0.057760000228881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,16384,2,8,8,1,power_law_1.2,0.05826560258865356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,1,balanced,0.7699999809265137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,1,balanced,0.7712799708048502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,1,power_law_1.01,0.5511551856994629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,1,power_law_1.01,0.5622144222259522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,1,power_law_1.2,0.5530687808990479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,1,power_law_1.2,0.5536896228790283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,128,balanced,0.04622933268547058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,128,balanced,0.047930667797724404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,128,power_law_1.01,0.04469760060310364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,128,power_law_1.01,0.04650880098342895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,128,power_law_1.2,0.045100799202919005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,128,power_law_1.2,0.045440000295639035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,16,balanced,0.080485333998998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,16,balanced,0.08241599798202515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,16,power_law_1.01,0.07448319792747497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,16,power_law_1.01,0.07560319900512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,16,power_law_1.2,0.07322239875793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,16,power_law_1.2,0.07675520181655884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,2,balanced,0.40245866775512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,2,balanced,0.40304001172383624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,2,power_law_1.01,0.3117824077606201
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,2,power_law_1.01,0.314246392250061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,2,power_law_1.2,0.32211201190948485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,2,power_law_1.2,0.3248192071914673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,256,balanced,0.04181333382924398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,256,balanced,0.0418453315893809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,256,power_law_1.01,0.04089600145816803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,256,power_law_1.01,0.04129279851913452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,256,power_law_1.2,0.040268799662590025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,256,power_law_1.2,0.0404992014169693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,32,balanced,0.05890666445096334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,32,balanced,0.05909333129723867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,32,power_law_1.01,0.055379199981689456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,32,power_law_1.01,0.05612800121307373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,32,power_law_1.2,0.05431680083274841
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,32,power_law_1.2,0.054585599899291994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,4,balanced,0.21753066778182983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,4,balanced,0.21887999773025513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,4,power_law_1.01,0.1548416018486023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,4,power_law_1.01,0.16433279514312743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,4,power_law_1.2,0.18008960485458375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,4,power_law_1.2,0.2050879955291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,64,balanced,0.04374399781227112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,64,balanced,0.04484800000985464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,64,power_law_1.01,0.040524798631668094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,64,power_law_1.01,0.04131200015544891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,64,power_law_1.2,0.03993600010871887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,64,power_law_1.2,0.04172160029411316
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,8,balanced,0.12717866897583008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,8,balanced,0.1283253331979116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,8,power_law_1.01,0.10927360057830811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,8,power_law_1.01,0.11866240501403809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,8,power_law_1.2,0.10402560234069824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,1,8,power_law_1.2,0.10706559419631959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,16,1,balanced,0.10556800166765849
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,16,1,balanced,0.10637866457303365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,16,1,power_law_1.01,0.08540160059928895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,16,1,power_law_1.01,0.08574079871177673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,16,1,power_law_1.2,0.08475520014762879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,16,1,power_law_1.2,0.08540160059928895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,2,1,balanced,0.4037439823150635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,2,1,balanced,0.40533868471781415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,2,1,power_law_1.01,0.2916928052902222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,2,1,power_law_1.01,0.30079360008239747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,2,1,power_law_1.2,0.2913599967956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,2,1,power_law_1.2,0.2983167886734009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,32,1,balanced,0.0886293351650238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,32,1,balanced,0.08873066306114197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,32,1,power_law_1.01,0.07417600154876709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,32,1,power_law_1.01,0.07482879757881164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,32,1,power_law_1.2,0.07383040189743043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,32,1,power_law_1.2,0.0750656008720398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,4,1,balanced,0.22383999824523926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,4,1,balanced,0.22427199284235635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,4,1,power_law_1.01,0.1672063946723938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,4,1,power_law_1.01,0.16927360296249389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,4,1,power_law_1.2,0.16628479957580566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,4,1,power_law_1.2,0.16944639682769774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,8,1,balanced,0.13806399703025818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,8,1,balanced,0.13974400361378989
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,8,1,power_law_1.01,0.10750080347061157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,8,1,power_law_1.01,0.10920319557189942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,8,1,power_law_1.2,0.10910719633102417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2048,8,256,8,1,power_law_1.2,0.10915199518203736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,1,balanced,0.6114559968312582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,1,balanced,0.61190398534139
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,1,power_law_1.01,0.5100607872009277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,1,power_law_1.01,0.5105023860931397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,1,power_law_1.2,0.5013567924499511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,1,power_law_1.2,0.5045887947082519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,16,balanced,0.07147733370463054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,16,balanced,0.07211733361085255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,16,power_law_1.01,0.06958079934120179
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,16,power_law_1.01,0.07043200135231018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,16,power_law_1.2,0.06928640007972717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,16,power_law_1.2,0.07109760046005249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,2,balanced,0.3237973252932231
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,2,balanced,0.32472000519434613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,2,power_law_1.01,0.27306880950927737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,2,power_law_1.01,0.28624639511108396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,2,power_law_1.2,0.2758336067199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,2,power_law_1.2,0.27630081176757815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,32,balanced,0.059802666306495667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,32,balanced,0.05981333553791046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,32,power_law_1.01,0.05677440166473389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,32,power_law_1.01,0.059680002927780154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,32,power_law_1.2,0.0546176016330719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,32,power_law_1.2,0.05707520246505737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,4,balanced,0.17924267053604126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,4,balanced,0.17989865938822427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,4,power_law_1.01,0.15497599840164183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,4,power_law_1.01,0.15934720039367675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,4,power_law_1.2,0.15203839540481567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,4,power_law_1.2,0.1558079957962036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,8,balanced,0.10726400216420491
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,8,balanced,0.10850666960080464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,8,power_law_1.01,0.09755520224571228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,8,power_law_1.01,0.10026880502700805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,8,power_law_1.2,0.09715200066566468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,1,8,power_law_1.2,0.09807360172271729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,2,1,balanced,0.32442132631937665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,2,1,balanced,0.3263840079307556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,2,1,power_law_1.01,0.27238399982452394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,2,1,power_law_1.01,0.2724096059799194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,2,1,power_law_1.2,0.2710911989212036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,2,1,power_law_1.2,0.27859840393066404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,4,1,balanced,0.1885813275973002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,4,1,balanced,0.19016534090042114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,4,1,power_law_1.01,0.16122879981994628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,4,1,power_law_1.01,0.1628224015235901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,4,1,power_law_1.2,0.16072319746017455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,4,1,power_law_1.2,0.16599040031433104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,8,1,balanced,0.11458667119344075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,8,1,balanced,0.11505599816640218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,8,1,power_law_1.01,0.09920639991760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,8,1,power_law_1.01,0.10005760192871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,8,1,power_law_1.2,0.10043519735336304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,6144,2560,8,160,8,1,power_law_1.2,0.10085120201110839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,1,balanced,0.902949333190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,1,balanced,0.9031573136647543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,1,power_law_1.01,0.6517248153686523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,1,power_law_1.01,0.6543104171752929
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,1,power_law_1.2,0.6447296142578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,1,power_law_1.2,0.6475647926330567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,128,balanced,0.08322666585445404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,128,balanced,0.08878399928410848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,128,power_law_1.01,0.08072959780693054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,128,power_law_1.01,0.08315520286560059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,128,power_law_1.2,0.08062080144882203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,128,power_law_1.2,0.08417919874191285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,16,balanced,0.09290132919947307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,16,balanced,0.09291199843088786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,16,power_law_1.01,0.08451840281486511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,16,power_law_1.01,0.09100800156593322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,16,power_law_1.2,0.07752320170402527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,16,power_law_1.2,0.08325759768486023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,2,balanced,0.4699466625849406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,2,balanced,0.4710400104522705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,2,power_law_1.01,0.38109440803527833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,2,power_law_1.01,0.38495359420776365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,2,power_law_1.2,0.3590143918991089
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,2,power_law_1.2,0.3790015935897827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,256,balanced,0.06074133515357971
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,256,balanced,0.06247999767462412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,256,power_law_1.01,0.05542399883270264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,256,power_law_1.01,0.06294400095939637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,256,power_law_1.2,0.055340802669525145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,256,power_law_1.2,0.05578879714012146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,32,balanced,0.06345599889755249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,32,balanced,0.06491200129191081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,32,power_law_1.01,0.05911039710044861
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,32,power_law_1.01,0.0606656014919281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,32,power_law_1.2,0.05869439840316772
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,32,power_law_1.2,0.061408001184463504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,4,balanced,0.2535253365834554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,4,balanced,0.2550560037295024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,4,power_law_1.01,0.21239678859710692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,4,power_law_1.01,0.22540159225463868
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,4,power_law_1.2,0.20993280410766602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,4,power_law_1.2,0.21850240230560303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,64,balanced,0.06674133241176605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,64,balanced,0.07066666583220164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,64,power_law_1.01,0.058771198987960814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,64,power_law_1.01,0.061286401748657224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,64,power_law_1.2,0.062438398599624634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,64,power_law_1.2,0.06366080045700073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,8,balanced,0.14753066500027975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,8,balanced,0.14843199650446573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,8,power_law_1.01,0.11994240283966065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,8,power_law_1.01,0.12779519557952881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,8,power_law_1.2,0.11929600238800049
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,1,8,power_law_1.2,0.12407040596008301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,16,1,balanced,0.11914133032162984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,16,1,balanced,0.12145066261291504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,16,1,power_law_1.01,0.09741439819335937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,16,1,power_law_1.01,0.09789440035820007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,16,1,power_law_1.2,0.09658880233764648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,16,1,power_law_1.2,0.09681280255317688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,2,1,balanced,0.4689919948577881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,2,1,balanced,0.4713493188222249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,2,1,power_law_1.01,0.34917120933532714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,2,1,power_law_1.01,0.3516607999801636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,2,1,power_law_1.2,0.34459519386291504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,2,1,power_law_1.2,0.3471231937408447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,32,1,balanced,0.10098133484522502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,32,1,balanced,0.10159466663996379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,32,1,power_law_1.01,0.08482559919357299
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,32,1,power_law_1.01,0.08485119938850402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,32,1,power_law_1.2,0.08331519961357117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,32,1,power_law_1.2,0.08424959778785705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,4,1,balanced,0.2583093245824178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,4,1,balanced,0.26047466198603314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,4,1,power_law_1.01,0.1974079966545105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,4,1,power_law_1.01,0.19778560400009154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,4,1,power_law_1.2,0.19129600524902343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,4,1,power_law_1.2,0.19543039798736572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,8,1,balanced,0.15813333789507547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,8,1,balanced,0.15929599603017172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,8,1,power_law_1.01,0.12617599964141846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,8,1,power_law_1.01,0.1269503951072693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,8,1,power_law_1.2,0.12368639707565307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,256,8,1,power_law_1.2,0.12433919906616211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,1,balanced,1.3295146624247234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,1,balanced,1.3302133083343506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,1,power_law_1.01,0.6725696086883545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,1,power_law_1.01,0.6936895847320557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,1,power_law_1.2,0.6371647834777832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,1,power_law_1.2,0.6435711860656739
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,128,balanced,0.051594664653142296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,128,balanced,0.054655998945236206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,128,power_law_1.01,0.04981760084629059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,128,power_law_1.01,0.05432320237159729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,128,power_law_1.2,0.047142401337623596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,128,power_law_1.2,0.047219198942184445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,16,balanced,0.12091733018557231
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,16,balanced,0.12138133247693379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,16,power_law_1.01,0.10531200170516967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,16,power_law_1.01,0.1144320011138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,16,power_law_1.2,0.10957440137863159
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,16,power_law_1.2,0.10990079641342163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,2,balanced,0.6824533144632975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,2,balanced,0.6838826338450114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,2,power_law_1.01,0.3864383935928345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,2,power_law_1.01,0.4013696193695068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,2,power_law_1.2,0.37287039756774903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,2,power_law_1.2,0.3751359939575195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,32,balanced,0.07794133325417836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,32,balanced,0.0784746656815211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,32,power_law_1.01,0.06941440105438232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,32,power_law_1.01,0.0717248022556305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,32,power_law_1.2,0.060083198547363284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,32,power_law_1.2,0.06722559928894042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,4,balanced,0.3598666588465373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,4,balanced,0.36059733231862384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,4,power_law_1.01,0.24098560810089112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,4,power_law_1.01,0.2537472009658813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,4,power_law_1.2,0.2127552032470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,4,power_law_1.2,0.2584320068359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,64,balanced,0.058789332707722984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,64,balanced,0.06018133461475372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,64,power_law_1.01,0.050892800092697144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,64,power_law_1.01,0.056569600105285646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,64,power_law_1.2,0.05198079943656921
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,64,power_law_1.2,0.05445759892463684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,8,balanced,0.20060799519220987
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,8,balanced,0.20069332917531332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,8,power_law_1.01,0.15122560262680054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,8,power_law_1.01,0.16206719875335693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,8,power_law_1.2,0.17663999795913696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,1,8,power_law_1.2,0.19898879528045654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,16,1,balanced,0.1604213317235311
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,16,1,balanced,0.16063466668128967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,16,1,power_law_1.01,0.10480639934539795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,16,1,power_law_1.01,0.10493439435958862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,16,1,power_law_1.2,0.0998207986354828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,16,1,power_law_1.2,0.10007679462432861
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,2,1,balanced,0.6864906946818033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,2,1,balanced,0.6884426275889078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,2,1,power_law_1.01,0.36279680728912356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,2,1,power_law_1.01,0.3704319953918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,2,1,power_law_1.2,0.3241472005844116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,2,1,power_law_1.2,0.3469311952590942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,32,1,balanced,0.13173333803812662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,32,1,balanced,0.13173866271972656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,32,1,power_law_1.01,0.09000319838523865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,32,1,power_law_1.01,0.09141119718551635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,32,1,power_law_1.2,0.08650879859924317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,32,1,power_law_1.2,0.08736000061035157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,4,1,balanced,0.36632001399993896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,4,1,balanced,0.36720001697540283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,4,1,power_law_1.01,0.20699520111083985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,4,1,power_law_1.01,0.2116544008255005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,4,1,power_law_1.2,0.19285119771957399
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,4,1,power_law_1.2,0.19366400241851806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,8,1,balanced,0.21762667099634805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,8,1,balanced,0.21836799383163452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,8,1,power_law_1.01,0.13373440504074097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,8,1,power_law_1.01,0.13441920280456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,8,1,power_law_1.2,0.12672640085220338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,48,7168,2048,8,384,8,1,power_law_1.2,0.12986880540847778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,1,balanced,0.10048533479372661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,1,balanced,0.10071466366449992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,1,power_law_1.01,0.11280640363693237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,1,power_law_1.01,0.11537280082702636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,1,power_law_1.2,0.11310080289840699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,1,power_law_1.2,0.1150272011756897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,128,balanced,0.03743999948104223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,128,balanced,0.037471999724706016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,128,power_law_1.01,0.036582401394844054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,128,power_law_1.01,0.03751679956912994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,128,power_law_1.2,0.0365119993686676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,128,power_law_1.2,0.036550399661064145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,16,balanced,0.0394400010506312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,16,balanced,0.03965333352486292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,16,power_law_1.01,0.03933440148830414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,16,power_law_1.01,0.03944959938526153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,16,power_law_1.2,0.0392767995595932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,16,power_law_1.2,0.039801600575447085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,2,balanced,0.06261333326498668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,2,balanced,0.0642080008983612
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,2,power_law_1.01,0.06804479956626892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,2,power_law_1.01,0.06830719709396363
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,2,power_law_1.2,0.0686464011669159
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,2,power_law_1.2,0.06958720088005066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,32,balanced,0.039594667653242745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,32,balanced,0.039664000272750854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,32,power_law_1.01,0.037503999471664426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,32,power_law_1.01,0.03809280097484589
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,32,power_law_1.2,0.03723520040512085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,32,power_law_1.2,0.037273600697517395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,4,balanced,0.04593066871166229
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,4,balanced,0.04859733581542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,4,power_law_1.01,0.05079039931297302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,4,power_law_1.01,0.051583999395370485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,4,power_law_1.2,0.04978559911251068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,4,power_law_1.2,0.05231999754905701
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,64,balanced,0.038015998899936676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,64,balanced,0.038586666186650596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,64,power_law_1.01,0.03709439933300018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,64,power_law_1.01,0.037401598691940305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,64,power_law_1.2,0.036671999096870425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,64,power_law_1.2,0.03716480135917664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,8,balanced,0.05006400247414907
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,8,balanced,0.0517546683549881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,8,power_law_1.01,0.04760960042476654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,8,power_law_1.01,0.0489984005689621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,8,power_law_1.2,0.04688000082969666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,1,8,power_law_1.2,0.0520576000213623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,2,1,balanced,0.07293333113193512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,2,1,balanced,0.07386666536331177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,2,1,power_law_1.01,0.07728000283241272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,2,1,power_law_1.01,0.07743359804153442
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,2,1,power_law_1.2,0.07742080092430115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,2,1,power_law_1.2,0.07943040132522583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,4,1,balanced,0.06017066538333893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,4,1,balanced,0.06226666768391927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,4,1,power_law_1.01,0.06233599781990051
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,4,1,power_law_1.01,0.06402559876441956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,4,1,power_law_1.2,0.0643455982208252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,2048,768,8,128,4,1,power_law_1.2,0.06467840075492859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,1,balanced,0.3612053394317627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,1,balanced,0.3646186590194702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,1,power_law_1.01,0.4065216064453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,1,power_law_1.01,0.41216001510620115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,1,power_law_1.2,0.4217663764953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,1,power_law_1.2,0.42488322257995603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,128,balanced,0.043509334325790405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,128,balanced,0.04363200068473816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,128,power_law_1.01,0.04106239974498749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,128,power_law_1.01,0.04110719859600067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,128,power_law_1.2,0.04084480106830597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,128,power_law_1.2,0.041817599534988405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,16,balanced,0.09789866209030151
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,16,balanced,0.10250666737556458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,16,power_law_1.01,0.08214399814605713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,16,power_law_1.01,0.09229440093040467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,16,power_law_1.2,0.07879040241241456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,16,power_law_1.2,0.07948160171508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,2,balanced,0.18517333269119263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,2,balanced,0.18531733751296997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,2,power_law_1.01,0.18883199691772462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,2,power_law_1.01,0.19144320487976074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,2,power_law_1.2,0.19121919870376586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,2,power_law_1.2,0.1945024013519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,256,balanced,0.0436160018046697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,256,balanced,0.04364266494909922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,256,power_law_1.01,0.04095360040664673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,256,power_law_1.01,0.0412992000579834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,256,power_law_1.2,0.04056319892406464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,256,power_law_1.2,0.04103040099143982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,32,balanced,0.058229332168896995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,32,balanced,0.058277333776156105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,32,power_law_1.01,0.05311999917030334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,32,power_law_1.01,0.05354239940643311
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,32,power_law_1.2,0.05343359708786011
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,32,power_law_1.2,0.054611200094223024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,4,balanced,0.11334400375684102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,4,balanced,0.11380267143249512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,4,power_law_1.01,0.1078336000442505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,4,power_law_1.01,0.10895359516143799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,4,power_law_1.2,0.1135103940963745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,4,power_law_1.2,0.11514240503311157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,64,balanced,0.045498669147491455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,64,balanced,0.04635733366012573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,64,power_law_1.01,0.04319359958171844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,64,power_law_1.01,0.04348160028457641
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,64,power_law_1.2,0.044147199392318724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,64,power_law_1.2,0.04465279877185822
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,8,balanced,0.0845973292986552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,8,balanced,0.08533866206804912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,8,power_law_1.01,0.07878400087356567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,8,power_law_1.01,0.07976319789886474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,8,power_law_1.2,0.08018559813499451
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,1,8,power_law_1.2,0.08231040239334106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,2,1,balanced,0.22398932774861655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,2,1,balanced,0.2241226633389791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,2,1,power_law_1.01,0.24936959743499756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,2,1,power_law_1.01,0.24972798824310302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,2,1,power_law_1.2,0.2565824031829834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,2,1,power_law_1.2,0.25785601139068604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,4,1,balanced,0.14478400349617004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,4,1,balanced,0.14574399590492249
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,4,1,power_law_1.01,0.15249279737472535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,4,1,power_law_1.01,0.1536064028739929
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,4,1,power_law_1.2,0.1573632001876831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,4,1,power_law_1.2,0.15749759674072267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,8,1,balanced,0.11476266384124756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,8,1,balanced,0.11542933185895284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,8,1,power_law_1.01,0.12171519994735717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,8,1,power_law_1.01,0.12259839773178101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,8,1,power_law_1.2,0.12291200160980224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,3072,1536,8,256,8,1,power_law_1.2,0.12383999824523925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,1,balanced,0.2262293299039205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,1,balanced,0.2266613245010376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,1,power_law_1.01,0.2616384029388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,1,power_law_1.01,0.27111680507659913
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,1,power_law_1.2,0.2699199914932251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,1,power_law_1.2,0.27530879974365235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,2,balanced,0.11375466982523601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,2,balanced,0.11581866939862569
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,2,power_law_1.01,0.16314239501953126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,2,power_law_1.01,0.18328959941864015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,2,power_law_1.2,0.16881920099258424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,2,power_law_1.2,0.1805567979812622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,4,balanced,0.08649599552154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,4,balanced,0.08690133690834045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,4,power_law_1.01,0.14132479429244996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,4,power_law_1.01,0.16727039813995362
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,4,power_law_1.2,0.11875200271606445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,4,power_law_1.2,0.11880960464477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,8,balanced,0.06714133421579997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,8,balanced,0.06950399776299794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,8,power_law_1.01,0.09372159838676453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,8,power_law_1.01,0.10291839838027954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,8,power_law_1.2,0.09342719912528992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,1,8,power_law_1.2,0.09751039743423462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,16,1,balanced,0.04780800143877665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,16,1,balanced,0.04794133206208547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,16,1,power_law_1.01,0.04750080108642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,16,1,power_law_1.01,0.04902400076389313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,16,1,power_law_1.2,0.04844799935817719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,16,1,power_law_1.2,0.04885759949684143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,2,1,balanced,0.12781332929929098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,2,1,balanced,0.12918933232625326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,2,1,power_law_1.01,0.1492095947265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,2,1,power_law_1.01,0.15521279573440552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,2,1,power_law_1.2,0.14979840517044068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,2,1,power_law_1.2,0.15166079998016357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,32,1,balanced,0.04167466859022776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,32,1,balanced,0.04178666571776072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,32,1,power_law_1.01,0.04232319891452789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,32,1,power_law_1.01,0.04430719912052154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,32,1,power_law_1.2,0.042847999930381776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,32,1,power_law_1.2,0.04349440038204193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,4,1,balanced,0.08454400300979614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,4,1,balanced,0.08530666430791219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,4,1,power_law_1.01,0.09366400241851806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,4,1,power_law_1.01,0.0954367995262146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,4,1,power_law_1.2,0.09329280257225037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,4,1,power_law_1.2,0.09423999786376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,8,1,balanced,0.06351466476917267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,8,1,balanced,0.06454400221506755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,8,1,power_law_1.01,0.06632959842681885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,8,1,power_law_1.01,0.06649600267410279
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,8,1,power_law_1.2,0.06684160232543945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,14336,2,8,8,1,power_law_1.2,0.06759039759635925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,1,balanced,0.27029865980148315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,1,balanced,0.2704799969991048
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,1,power_law_1.01,0.31393280029296877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,1,power_law_1.01,0.3170880079269409
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,1,power_law_1.2,0.3276160001754761
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,1,power_law_1.2,0.3284735918045044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,128,balanced,0.04563199977080027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,128,balanced,0.04573333263397217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,128,power_law_1.01,0.044198399782180785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,128,power_law_1.01,0.044531199336051944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,128,power_law_1.2,0.044921600818634035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,128,power_law_1.2,0.04506880044937134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,16,balanced,0.05820799867312113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,16,balanced,0.059248000383377075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,16,power_law_1.01,0.05713919997215271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,16,power_law_1.01,0.0626688003540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,16,power_law_1.2,0.06157439947128296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,16,power_law_1.2,0.06296319961547851
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,2,balanced,0.14274133245150247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,2,balanced,0.14427733421325684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,2,power_law_1.01,0.15864959955215455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,2,power_law_1.01,0.15907200574874877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,2,power_law_1.2,0.1630784034729004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,2,power_law_1.2,0.1638527989387512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,32,balanced,0.047237331668535866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,32,balanced,0.047775998711586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,32,power_law_1.01,0.047200000286102294
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,32,power_law_1.01,0.04800640046596527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,32,power_law_1.2,0.04828799962997436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,32,power_law_1.2,0.05061119794845581
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,4,balanced,0.09719467163085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,4,balanced,0.09734400113423665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,4,power_law_1.01,0.09975039958953857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,4,power_law_1.01,0.10079360008239746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,4,power_law_1.2,0.10243200063705445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,4,power_law_1.2,0.10979199409484863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,64,balanced,0.045461331804593406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,64,balanced,0.04607999821503957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,64,power_law_1.01,0.045100799202919005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,64,power_law_1.01,0.045817598700523376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,64,power_law_1.2,0.045184001326560974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,64,power_law_1.2,0.04578559994697571
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,8,balanced,0.09139733513196309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,8,balanced,0.09197866916656494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,8,power_law_1.01,0.07862399816513062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,8,power_law_1.01,0.09549440145492553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,8,power_law_1.2,0.08282880187034607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,1,8,power_law_1.2,0.08362879753112792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,2,1,balanced,0.17233065764109293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,2,1,balanced,0.17254400253295898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,2,1,power_law_1.01,0.19521280527114868
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,2,1,power_law_1.01,0.19872000217437744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,2,1,power_law_1.2,0.20182399749755858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,2,1,power_law_1.2,0.203987193107605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,4,1,balanced,0.11716799934705098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,4,1,balanced,0.11752000451087952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,4,1,power_law_1.01,0.12679040431976318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,4,1,power_law_1.01,0.12735359668731688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,4,1,power_law_1.2,0.12739839553833007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,4,1,power_law_1.2,0.12828160524368287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,8,1,balanced,0.09473599990208943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,8,1,balanced,0.09598400195439656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,8,1,power_law_1.01,0.09931520223617554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,8,1,power_law_1.01,0.09985920190811157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,8,1,power_law_1.2,0.09962239861488342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,4096,1536,8,128,8,1,power_law_1.2,0.10047999620437623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,1,balanced,0.42878401279449463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,1,balanced,0.4299199978510539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,1,power_law_1.01,0.5061759948730469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,1,power_law_1.01,0.5098048210144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,1,power_law_1.2,0.5139711856842041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,1,power_law_1.2,0.5195007801055909
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,2,balanced,0.16498133540153503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,2,balanced,0.16562133034070334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,2,power_law_1.01,0.2467967987060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,2,power_law_1.01,0.2630592107772827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,2,power_law_1.2,0.23679358959198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,2,power_law_1.2,0.26081280708312987
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,4,balanced,0.10796800255775452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,4,balanced,0.10965866843859355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,4,power_law_1.01,0.18519680500030516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,4,power_law_1.01,0.1921280026435852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,4,power_law_1.2,0.1939136028289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,4,power_law_1.2,0.20025599002838135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,8,balanced,0.08373866478602092
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,8,balanced,0.08463999629020691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,8,power_law_1.01,0.12257280349731445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,8,power_law_1.01,0.13470079898834228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,8,power_law_1.2,0.13015040159225463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,1,8,power_law_1.2,0.13968640565872192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,16,1,balanced,0.0642986645301183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,16,1,balanced,0.0662666658560435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,16,1,power_law_1.01,0.06778879761695862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,16,1,power_law_1.01,0.06844159960746765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,16,1,power_law_1.2,0.06895999908447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,16,1,power_law_1.2,0.0701632022857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,2,1,balanced,0.18820265928904215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,2,1,balanced,0.1887893279393514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,2,1,power_law_1.01,0.22885119915008545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,2,1,power_law_1.01,0.22951679229736327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,2,1,power_law_1.2,0.22539520263671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,2,1,power_law_1.2,0.234771203994751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,32,1,balanced,0.047797332207361855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,32,1,balanced,0.05295999844868978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,32,1,power_law_1.01,0.05315200090408325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,32,1,power_law_1.01,0.053324800729751584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,32,1,power_law_1.2,0.05206400156021118
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,32,1,power_law_1.2,0.053388798236846925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,4,1,balanced,0.11672533551851909
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,4,1,balanced,0.11796800295511882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,4,1,power_law_1.01,0.13586560487747193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,4,1,power_law_1.01,0.1385151982307434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,4,1,power_law_1.2,0.13624320030212403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,4,1,power_law_1.2,0.13827199935913087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,8,1,balanced,0.08369599779446919
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,8,1,balanced,0.08422399560610454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,8,1,power_law_1.01,0.0900160014629364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,8,1,power_law_1.01,0.09127680063247681
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,8,1,power_law_1.2,0.09016960263252258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,16384,2,8,8,1,power_law_1.2,0.09068800210952759
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,1,balanced,0.9027413527170817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,1,balanced,0.904304027557373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,1,power_law_1.01,1.026585578918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,1,power_law_1.01,1.0522944450378418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,1,power_law_1.2,1.0829440116882325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,1,power_law_1.2,1.0842944145202638
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,128,balanced,0.05258133510748545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,128,balanced,0.05421866476535797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,128,power_law_1.01,0.05140479803085327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,128,power_law_1.01,0.054150402545928955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,128,power_law_1.2,0.051974397897720334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,128,power_law_1.2,0.05203840136528015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,16,balanced,0.16562133034070334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,16,balanced,0.18372267484664917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,16,power_law_1.01,0.12316800355911255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,16,power_law_1.01,0.14062080383300782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,16,power_law_1.2,0.11955840587615967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,16,power_law_1.2,0.13992960453033448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,2,balanced,0.4294240077336629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,2,balanced,0.43113064765930176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,2,power_law_1.01,0.4370368003845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,2,power_law_1.01,0.44202880859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,2,power_law_1.2,0.45452160835266114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,2,power_law_1.2,0.46485118865966796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,256,balanced,0.0517493337392807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,256,balanced,0.05194133520126343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,256,power_law_1.01,0.0505407989025116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,256,power_law_1.01,0.05063679814338684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,256,power_law_1.2,0.05004159808158874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,256,power_law_1.2,0.05013120174407959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,32,balanced,0.08620267113049825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,32,balanced,0.08689600229263306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,32,power_law_1.01,0.07891200184822082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,32,power_law_1.01,0.08039680123329163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,32,power_law_1.2,0.07996159791946411
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,32,power_law_1.2,0.08005120158195496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,4,balanced,0.24014933904012045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,4,balanced,0.2412053346633911
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,4,power_law_1.01,0.22357759475708008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,4,power_law_1.01,0.23452799320220946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,4,power_law_1.2,0.23799679279327393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,4,power_law_1.2,0.24798719882965087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,64,balanced,0.06434666613737743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,64,balanced,0.06584533552328746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,64,power_law_1.01,0.06130560040473938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,64,power_law_1.01,0.06183680295944214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,64,power_law_1.2,0.06378880143165588
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,64,power_law_1.2,0.06467199921607972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,8,balanced,0.16055466731389365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,8,balanced,0.16285866498947144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,8,power_law_1.01,0.14729599952697753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,8,power_law_1.01,0.14759680032730102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,8,power_law_1.2,0.15011839866638182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,1,8,power_law_1.2,0.15511679649353027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,16,1,balanced,0.171450674533844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,16,1,balanced,0.17173866430918375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,16,1,power_law_1.01,0.18444160223007203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,16,1,power_law_1.01,0.18502399921417237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,16,1,power_law_1.2,0.1869055986404419
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,16,1,power_law_1.2,0.1871999979019165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,2,1,balanced,0.48469332853953045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,2,1,balanced,0.4848053455352783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,2,1,power_law_1.01,0.5333183765411377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,2,1,power_law_1.01,0.5335040092468262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,2,1,power_law_1.2,0.5641920089721679
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,2,1,power_law_1.2,0.5655231952667237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,32,1,balanced,0.1534293293952942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,32,1,balanced,0.1535040040810903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,32,1,power_law_1.01,0.16711039543151857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,32,1,power_law_1.01,0.1672320008277893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,32,1,power_law_1.2,0.16843520402908324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,32,1,power_law_1.2,0.1689471960067749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,4,1,balanced,0.28964267174402875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,4,1,balanced,0.2934933304786682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,4,1,power_law_1.01,0.3098560094833374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,4,1,power_law_1.01,0.3151488065719604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,4,1,power_law_1.2,0.3241152048110962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,4,1,power_law_1.2,0.32704639434814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,8,1,balanced,0.20566932360331217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,8,1,balanced,0.20637865861256918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,8,1,power_law_1.01,0.22093439102172852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,8,1,power_law_1.01,0.22242560386657714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,8,1,power_law_1.2,0.22518401145935057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2048,8,256,8,1,power_law_1.2,0.22655999660491943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,1,balanced,0.7363893191019694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,1,balanced,0.7367520332336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,1,power_law_1.01,0.8018239974975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,1,power_law_1.01,0.8100992202758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,1,power_law_1.2,0.8520511627197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,1,power_law_1.2,0.8520895957946777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,16,balanced,0.09693866968154907
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,16,balanced,0.09925867120424907
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,16,power_law_1.01,0.09790080189704894
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,16,power_law_1.01,0.09852799773216248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,16,power_law_1.2,0.10116480588912964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,16,power_law_1.2,0.10565760135650634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,2,balanced,0.35070399443308514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,2,balanced,0.3507680098215739
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,2,power_law_1.01,0.3767807960510254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,2,power_law_1.01,0.3803904056549072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,2,power_law_1.2,0.3832000017166138
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,2,power_law_1.2,0.40319361686706545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,32,balanced,0.07667199770609538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,32,balanced,0.08246933420499165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,32,power_law_1.01,0.07601280212402343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,32,power_law_1.01,0.07859839797019959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,32,power_law_1.2,0.07865599989891052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,32,power_law_1.2,0.08005120158195496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,4,balanced,0.22984532515207926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,4,balanced,0.23148266474405924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,4,power_law_1.01,0.210534405708313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,4,power_law_1.01,0.21841919422149658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,4,power_law_1.2,0.22534399032592772
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,4,power_law_1.2,0.22765440940856935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,8,balanced,0.24965333938598633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,8,balanced,0.2549546758333842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,8,power_law_1.01,0.17863680124282838
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,8,power_law_1.01,0.21605119705200196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,8,power_law_1.2,0.18158719539642335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,1,8,power_law_1.2,0.22459518909454346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,2,1,balanced,0.4103626807530721
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,2,1,balanced,0.41283734639485675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,2,1,power_law_1.01,0.44216318130493165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,2,1,power_law_1.01,0.4490943908691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,2,1,power_law_1.2,0.46366081237792967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,2,1,power_law_1.2,0.46691198348999025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,4,1,balanced,0.26366933186848956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,4,1,balanced,0.26531734069188434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,4,1,power_law_1.01,0.27992959022521974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,4,1,power_law_1.01,0.2810688018798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,4,1,power_law_1.2,0.2847359895706177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,4,1,power_law_1.2,0.28580479621887206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,8,1,balanced,0.16950400670369467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,8,1,balanced,0.1704746683438619
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,8,1,power_law_1.01,0.1704256057739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,8,1,power_law_1.01,0.17233279943466187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,8,1,power_law_1.2,0.17471359968185424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,6144,2560,8,160,8,1,power_law_1.2,0.17509119510650634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,1,balanced,1.0561439990997314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,1,balanced,1.0582186381022136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,1,power_law_1.01,1.2099519729614259
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,1,power_law_1.01,1.2212608337402344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,1,power_law_1.2,1.2485695838928224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,1,power_law_1.2,1.2796735763549805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,128,balanced,0.05618133147557577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,128,balanced,0.05824000140031179
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,128,power_law_1.01,0.05496320128440857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,128,power_law_1.01,0.05702400207519531
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,128,power_law_1.2,0.056985598802566526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,128,power_law_1.2,0.05807999968528747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,16,balanced,0.18388799826304117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,16,balanced,0.19489065806070963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,16,power_law_1.01,0.13809280395507811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,16,power_law_1.01,0.14395519495010375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,16,power_law_1.2,0.13901439905166627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,16,power_law_1.2,0.1419648051261902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,2,balanced,0.4972746769587199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,2,balanced,0.4973920186360677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,2,power_law_1.01,0.5130815982818604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,2,power_law_1.01,0.5192128181457519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,2,power_law_1.2,0.536300802230835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,2,power_law_1.2,0.5375743865966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,256,balanced,0.054757331808408104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,256,balanced,0.05608533322811127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,256,power_law_1.01,0.053523200750350955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,256,power_law_1.01,0.05384320020675659
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,256,power_law_1.2,0.05539839863777161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,256,power_law_1.2,0.055430400371551516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,32,balanced,0.09405866265296936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,32,balanced,0.09567466378211975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,32,power_law_1.01,0.08819199800491333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,32,power_law_1.01,0.09114879965782166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,32,power_law_1.2,0.09025279879570007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,32,power_law_1.2,0.09205759763717651
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,4,balanced,0.27593066294987995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,4,balanced,0.27666133642196655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,4,power_law_1.01,0.2669503927230835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,4,power_law_1.01,0.27003519535064696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,4,power_law_1.2,0.28017919063568114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,4,power_law_1.2,0.2853503942489624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,64,balanced,0.07449066638946533
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,64,balanced,0.0746666689713796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,64,power_law_1.01,0.06721919775009155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,64,power_law_1.01,0.06774399876594543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,64,power_law_1.2,0.06869760155677795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,64,power_law_1.2,0.07329279780387879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,8,balanced,0.1834826668103536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,8,balanced,0.18716265757878622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,8,power_law_1.01,0.16227840185165404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,8,power_law_1.01,0.16838400363922118
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,8,power_law_1.2,0.170905601978302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,1,8,power_law_1.2,0.17173759937286376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,16,1,balanced,0.19367466370264688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,16,1,balanced,0.19519466161727905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,16,1,power_law_1.01,0.20941441059112548
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,16,1,power_law_1.01,0.21006081104278565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,16,1,power_law_1.2,0.21164801120758056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,16,1,power_law_1.2,0.21227519512176513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,2,1,balanced,0.561194658279419
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,2,1,balanced,0.5630026658376058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,2,1,power_law_1.01,0.618995189666748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,2,1,power_law_1.01,0.6200831890106201
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,2,1,power_law_1.2,0.6467967987060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,2,1,power_law_1.2,0.6525568008422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,32,1,balanced,0.17458132902781168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,32,1,balanced,0.17538666725158691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,32,1,power_law_1.01,0.19005440473556517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,32,1,power_law_1.01,0.19047679901123046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,32,1,power_law_1.2,0.19227520227432252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,32,1,power_law_1.2,0.19294079542160034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,4,1,balanced,0.33402132987976074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,4,1,balanced,0.33826132615407306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,4,1,power_law_1.01,0.3606719970703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,4,1,power_law_1.01,0.3626496076583862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,4,1,power_law_1.2,0.3735680103302002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,4,1,power_law_1.2,0.37430400848388673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,8,1,balanced,0.23642132679621378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,8,1,balanced,0.2368746598561605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,8,1,power_law_1.01,0.2547904014587402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,8,1,power_law_1.01,0.25845119953155515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,8,1,power_law_1.2,0.25731201171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,256,8,1,power_law_1.2,0.25886080265045164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,1,balanced,1.5459893544514973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,1,balanced,1.5518827438354492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,1,power_law_1.01,1.4295231819152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,1,power_law_1.01,1.4348992347717284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,1,power_law_1.2,1.487622356414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,1,power_law_1.2,1.4947711944580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,128,balanced,0.06221333146095276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,128,balanced,0.06398933132489522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,128,power_law_1.01,0.06182399988174438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,128,power_law_1.01,0.062041598558425906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,128,power_law_1.2,0.060812801122665405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,128,power_law_1.2,0.06206079721450806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,16,balanced,0.365013321240743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,16,balanced,0.3658133347829183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,16,power_law_1.01,0.2294015884399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,16,power_law_1.01,0.25243520736694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,16,power_law_1.2,0.22339200973510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,16,power_law_1.2,0.23237760066986085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,2,balanced,0.7130080064137777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,2,balanced,0.7135146458943685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,2,power_law_1.01,0.6495359897613525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,2,power_law_1.01,0.6853631973266602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,2,power_law_1.2,0.6753791809082031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,2,power_law_1.2,0.6765183925628662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,32,balanced,0.10827199618021648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,32,balanced,0.1109333336353302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,32,power_law_1.01,0.1000704050064087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,32,power_law_1.01,0.103603196144104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,32,power_law_1.2,0.09883520007133484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,32,power_law_1.2,0.10072319507598877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,4,balanced,0.3859413464864095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,4,balanced,0.3861973285675049
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,4,power_law_1.01,0.3568959951400757
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,4,power_law_1.01,0.35902719497680663
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,4,power_law_1.2,0.3451711893081665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,4,power_law_1.2,0.35482239723205566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,64,balanced,0.08668800195058186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,64,balanced,0.0867733359336853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,64,power_law_1.01,0.08216320276260376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,64,power_law_1.01,0.0857151985168457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,64,power_law_1.2,0.08153600096702576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,64,power_law_1.2,0.08239359855651855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,8,balanced,0.28357867399851483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,8,balanced,0.2925173242886861
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,8,power_law_1.01,0.21943039894104005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,8,power_law_1.01,0.22004480361938478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,8,power_law_1.2,0.21143040657043458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,1,8,power_law_1.2,0.23029119968414308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,16,1,balanced,0.2534613410631816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,16,1,balanced,0.25463465849558514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,16,1,power_law_1.01,0.2309119939804077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,16,1,power_law_1.01,0.23315839767456054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,16,1,power_law_1.2,0.2331007957458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,16,1,power_law_1.2,0.23438720703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,2,1,balanced,0.8037066459655762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,2,1,balanced,0.8094720045725504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,2,1,power_law_1.01,0.7291840076446533
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,2,1,power_law_1.01,0.743180799484253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,2,1,power_law_1.2,0.7528319835662842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,2,1,power_law_1.2,0.7578112125396729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,32,1,balanced,0.22420799732208252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,32,1,balanced,0.22551467021306357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,32,1,power_law_1.01,0.2055743932723999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,32,1,power_law_1.01,0.2071615934371948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,32,1,power_law_1.2,0.2084736108779907
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,32,1,power_law_1.2,0.20974080562591552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,4,1,balanced,0.4627679983774821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,4,1,balanced,0.46532801787058514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,4,1,power_law_1.01,0.4146560192108154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,4,1,power_law_1.01,0.4284992218017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,4,1,power_law_1.2,0.4258111953735352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,4,1,power_law_1.2,0.4265920162200928
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,8,1,balanced,0.3134239912033081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,8,1,balanced,0.31492799520492554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,8,1,power_law_1.01,0.2823231935501099
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,8,1,power_law_1.01,0.28387839794158937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,8,1,power_law_1.2,0.289900803565979
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,512,7168,2048,8,384,8,1,power_law_1.2,0.29281280040740965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,1,balanced,0.3412160078684489
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,1,balanced,0.3478826681772868
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,1,power_law_1.01,0.38391680717468263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,1,power_law_1.01,0.38607358932495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,1,power_law_1.2,0.3906303882598877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,1,power_law_1.2,0.3923007965087891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,128,balanced,0.08463467160860698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,128,balanced,0.0846453309059143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,128,power_law_1.01,0.0964735984802246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,128,power_law_1.01,0.09685760140419006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,128,power_law_1.2,0.11196160316467285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,128,power_law_1.2,0.11230720281600952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,16,balanced,0.10259200135866801
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,16,balanced,0.10262399911880493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,16,power_law_1.01,0.12609280347824098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,16,power_law_1.01,0.1271232008934021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,16,power_law_1.2,0.13177599906921386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,16,power_law_1.2,0.13446400165557862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,2,balanced,0.21656533082326254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,2,balanced,0.21814932425816855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,2,power_law_1.01,0.2483135938644409
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,2,power_law_1.01,0.2513344049453735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,2,power_law_1.2,0.27219200134277344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,2,power_law_1.2,0.2728832006454468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,32,balanced,0.09020266930262248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,32,balanced,0.09103999535242717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,32,power_law_1.01,0.1093440055847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,32,power_law_1.01,0.10947840213775635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,32,power_law_1.2,0.12016639709472657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,32,power_law_1.2,0.12370560169219971
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,4,balanced,0.15154666701952615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,4,balanced,0.1519253353277842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,4,power_law_1.01,0.18045439720153808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,4,power_law_1.01,0.18859519958496093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,4,power_law_1.2,0.18522239923477174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,4,power_law_1.2,0.19723520278930665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,64,balanced,0.08552533388137817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,64,balanced,0.08630399902661641
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,64,power_law_1.01,0.10208640098571778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,64,power_law_1.01,0.10513919591903687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,64,power_law_1.2,0.11744639873504639
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,64,power_law_1.2,0.1176576018333435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,8,balanced,0.11869866649309795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,8,balanced,0.11937600374221802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,8,power_law_1.01,0.14392319917678834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,8,power_law_1.01,0.1466048002243042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,8,power_law_1.2,0.14940160512924194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,1,8,power_law_1.2,0.15180799961090088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,2,1,balanced,0.2602506677309672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,2,1,balanced,0.26157333453496295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,2,1,power_law_1.01,0.28042240142822267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,2,1,power_law_1.01,0.28192639350891113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,2,1,power_law_1.2,0.2823551893234253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,2,1,power_law_1.2,0.28266880512237547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,4,1,balanced,0.22509866952896118
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,4,1,balanced,0.22533865769704184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,4,1,power_law_1.01,0.2375488042831421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,4,1,power_law_1.01,0.23891839981079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,4,1,power_law_1.2,0.24084479808807374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,2048,768,8,128,4,1,power_law_1.2,0.2420799970626831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,1,balanced,1.4272799491882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,1,balanced,1.4288105964660645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,1,power_law_1.01,0.8170880317687989
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,1,power_law_1.01,0.8220416069030761
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,1,power_law_1.2,0.8573887825012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,1,power_law_1.2,0.8583488464355469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,128,balanced,0.12009066343307495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,128,balanced,0.12101866801579793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,128,power_law_1.01,0.1356287956237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,128,power_law_1.01,0.1383296012878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,128,power_law_1.2,0.14752639532089235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,128,power_law_1.2,0.15279359817504884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,16,balanced,0.16009599963823953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,16,balanced,0.1606666644414266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,16,power_law_1.01,0.1835904002189636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,16,power_law_1.01,0.1891711950302124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,16,power_law_1.2,0.1997760057449341
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,16,power_law_1.2,0.2002943992614746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,2,balanced,0.5671893358230591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,2,balanced,0.5699626604715983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,2,power_law_1.01,0.4893439769744873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,2,power_law_1.01,0.49010558128356935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,2,power_law_1.2,0.5230656147003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,2,power_law_1.2,0.5363903999328613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,256,balanced,0.11648000280062358
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,256,balanced,0.11872000495592754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,256,power_law_1.01,0.12984960079193114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,256,power_law_1.01,0.1319424033164978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,256,power_law_1.2,0.1427199959754944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,256,power_law_1.2,0.14317439794540404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,32,balanced,0.13662933309872946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,32,balanced,0.13809067010879517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,32,power_law_1.01,0.16165119409561157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,32,power_law_1.01,0.16310399770736694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,32,power_law_1.2,0.17260160446166992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,32,power_law_1.2,0.17581440210342408
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,4,balanced,0.2744693358739217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,4,balanced,0.27454932530721027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,4,power_law_1.01,0.3039680004119873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,4,power_law_1.01,0.3209536075592041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,4,power_law_1.2,0.3329792022705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,4,power_law_1.2,0.3564800024032593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,64,balanced,0.1276746690273285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,64,balanced,0.12966932853062949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,64,power_law_1.01,0.14402559995651246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,64,power_law_1.01,0.1477311968803406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,64,power_law_1.2,0.15717120170593263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,64,power_law_1.2,0.16216959953308105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,8,balanced,0.1988053321838379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,8,balanced,0.20003199577331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,8,power_law_1.01,0.22714879512786865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,8,power_law_1.01,0.2276992082595825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,8,power_law_1.2,0.248089599609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,1,8,power_law_1.2,0.25002241134643555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,2,1,balanced,0.813215970993042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,2,1,balanced,0.8144640127817789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,2,1,power_law_1.01,0.5116415977478027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,2,1,power_law_1.01,0.5122816085815429
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,2,1,power_law_1.2,0.5288000106811523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,2,1,power_law_1.2,0.5291903972625732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,4,1,balanced,0.5241386493047079
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,4,1,balanced,0.5258986552556356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,4,1,power_law_1.01,0.37397758960723876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,4,1,power_law_1.01,0.3761728048324585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,4,1,power_law_1.2,0.3842047929763794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,4,1,power_law_1.2,0.3844480037689209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,8,1,balanced,0.4217333396275838
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,8,1,balanced,0.4236533244450887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,8,1,power_law_1.01,0.3241600036621094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,8,1,power_law_1.01,0.3270848035812378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,8,1,power_law_1.2,0.3330751895904541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,3072,1536,8,256,8,1,power_law_1.2,0.33400959968566896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,1,balanced,1.2633546988169353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,1,balanced,1.2719306945800781
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,1,power_law_1.01,1.3223360061645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,1,power_law_1.01,1.3385024070739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,1,power_law_1.2,1.291756820678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,1,power_law_1.2,1.3210368156433105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,2,balanced,0.6878399848937988
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,2,balanced,0.6929600238800049
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,2,power_law_1.01,0.8530303955078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,2,power_law_1.01,0.8872320175170898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,2,power_law_1.2,0.8065152168273926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,2,power_law_1.2,0.9515711784362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,4,balanced,0.4134666522343953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,4,balanced,0.41368532180786133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,4,power_law_1.01,0.7026944160461426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,4,power_law_1.01,0.7646975994110108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,4,power_law_1.2,0.728172779083252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,4,power_law_1.2,0.7732800006866455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,8,balanced,0.27243200937906903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,8,balanced,0.2728586594263713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,8,power_law_1.01,0.6494719982147217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,8,power_law_1.01,0.6512383937835693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,8,power_law_1.2,0.6164095878601075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,1,8,power_law_1.2,0.644812822341919
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,16,1,balanced,0.22479466597239176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,16,1,balanced,0.2259999910990397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,16,1,power_law_1.01,0.22727680206298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,16,1,power_law_1.01,0.22841598987579345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,16,1,power_law_1.2,0.2275455951690674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,16,1,power_law_1.2,0.22817280292510986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,2,1,balanced,0.6873813470204672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,2,1,balanced,0.6880053679148356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,2,1,power_law_1.01,0.7264319896697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,2,1,power_law_1.01,0.7367551803588868
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,2,1,power_law_1.2,0.720198392868042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,2,1,power_law_1.2,0.7548672199249268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,32,1,balanced,0.19501866896947226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,32,1,balanced,0.19545066356658936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,32,1,power_law_1.01,0.19383039474487304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,32,1,power_law_1.01,0.1955456018447876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,32,1,power_law_1.2,0.19438079595565796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,32,1,power_law_1.2,0.19550080299377443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,4,1,balanced,0.4217226505279541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,4,1,balanced,0.42280534903208417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,4,1,power_law_1.01,0.4345407962799072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,4,1,power_law_1.01,0.43459200859069824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,4,1,power_law_1.2,0.43256320953369143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,4,1,power_law_1.2,0.4610176086425781
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,8,1,balanced,0.29126934210459393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,8,1,balanced,0.2929973403612773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,8,1,power_law_1.01,0.29831039905548096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,8,1,power_law_1.01,0.29922559261322024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,8,1,power_law_1.2,0.2998143911361694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,14336,2,8,8,1,power_law_1.2,0.3048255920410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,1,balanced,0.7413067022959391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,1,balanced,0.7430773576100668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,1,power_law_1.01,0.8485247611999511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,1,power_law_1.01,0.8492351531982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,1,power_law_1.2,0.8495552062988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,1,power_law_1.2,0.8739456176757813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,128,balanced,0.14703466494878134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,128,balanced,0.14801599582036337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,128,power_law_1.01,0.17570559978485106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,128,power_law_1.01,0.1773695945739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,128,power_law_1.2,0.20158720016479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,128,power_law_1.2,0.2023168087005615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,16,balanced,0.17641599973042807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,16,balanced,0.17730132738749185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,16,power_law_1.01,0.21976959705352783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,16,power_law_1.01,0.2413503885269165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,16,power_law_1.2,0.24854400157928466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,16,power_law_1.2,0.25454719066619874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,2,balanced,0.4225493272145589
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,2,balanced,0.4240640004475911
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,2,power_law_1.01,0.523744010925293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,2,power_law_1.01,0.5387904167175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,2,power_law_1.2,0.5037759780883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,2,power_law_1.2,0.5651840209960938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,32,balanced,0.15657599767049155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,32,balanced,0.15768000483512878
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,32,power_law_1.01,0.19587199687957763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,32,power_law_1.01,0.20770559310913086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,32,power_law_1.2,0.21203839778900146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,32,power_law_1.2,0.22464001178741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,4,balanced,0.2816693385442098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,4,balanced,0.282645324865977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,4,power_law_1.01,0.3527103900909424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,4,power_law_1.01,0.36456320285797117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,4,power_law_1.2,0.40014081001281737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,4,power_law_1.2,0.4027775764465332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,64,balanced,0.14870933691660562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,64,balanced,0.15030399958292642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,64,power_law_1.01,0.1851904034614563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,64,power_law_1.01,0.18570879697799683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,64,power_law_1.2,0.20278398990631102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,64,power_law_1.2,0.20899200439453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,8,balanced,0.21185066302617392
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,8,balanced,0.21333332856496176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,8,power_law_1.01,0.2700608015060425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,8,power_law_1.01,0.2760576009750366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,8,power_law_1.2,0.27450239658355713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,1,8,power_law_1.2,0.2957184076309204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,2,1,balanced,0.49211732546488446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,2,1,balanced,0.49530665079752606
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,2,1,power_law_1.01,0.5426623821258545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,2,1,power_law_1.01,0.5443456172943115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,2,1,power_law_1.2,0.5542463779449462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,2,1,power_law_1.2,0.5545599937438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,4,1,balanced,0.38412801424662274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,4,1,balanced,0.38661332925160724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,4,1,power_law_1.01,0.41763839721679685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,4,1,power_law_1.01,0.41913599967956544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,4,1,power_law_1.2,0.42407679557800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,4,1,power_law_1.2,0.42461438179016114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,8,1,balanced,0.34907734394073486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,8,1,balanced,0.34937067826588947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,8,1,power_law_1.01,0.36666240692138674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,8,1,power_law_1.01,0.36808319091796876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,8,1,power_law_1.2,0.36995840072631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,4096,1536,8,128,8,1,power_law_1.2,0.3750272035598755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,1,balanced,2.4692160288492837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,1,balanced,2.4873600006103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,1,power_law_1.01,2.597222328186035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,1,power_law_1.01,2.6848575592041017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,1,power_law_1.2,2.5893695831298826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,1,power_law_1.2,2.616441535949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,2,balanced,1.3033546606699626
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,2,balanced,1.3070346514383953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,2,power_law_1.01,1.6685440063476562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,2,power_law_1.01,1.853580856323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,2,power_law_1.2,1.7029184341430663
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,2,power_law_1.2,1.8245183944702148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,4,balanced,0.6987893581390381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,4,balanced,0.7001439730326334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,4,power_law_1.01,1.3340479850769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,4,power_law_1.01,1.3577216148376465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,4,power_law_1.2,1.5145024299621581
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,4,power_law_1.2,1.5431232452392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,8,balanced,0.41661866505940753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,8,balanced,0.4228266477584839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,8,power_law_1.01,1.1842559814453124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,8,power_law_1.01,1.2013631820678712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,8,power_law_1.2,1.2503423690795898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,1,8,power_law_1.2,1.2524288177490235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,16,1,balanced,0.32361066341400146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,16,1,balanced,0.3237333297729492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,16,1,power_law_1.01,0.32610559463500977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,16,1,power_law_1.01,0.3270400047302246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,16,1,power_law_1.2,0.3245824098587036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,16,1,power_law_1.2,0.3284480094909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,2,1,balanced,1.102778673171997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,2,1,balanced,1.1079946358998616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,2,1,power_law_1.01,1.1550911903381347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,2,1,power_law_1.01,1.1612031936645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,2,1,power_law_1.2,1.1440383911132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,2,1,power_law_1.2,1.1440640449523927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,32,1,balanced,0.27129065990448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,32,1,balanced,0.27222933371861774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,32,1,power_law_1.01,0.27308800220489504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,32,1,power_law_1.01,0.2734272003173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,32,1,power_law_1.2,0.2726016044616699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,32,1,power_law_1.2,0.27333118915557864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,4,1,balanced,0.651690681775411
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,4,1,balanced,0.653498649597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,4,1,power_law_1.01,0.6718272209167481
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,4,1,power_law_1.01,0.6770559787750244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,4,1,power_law_1.2,0.6898816108703614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,4,1,power_law_1.2,0.690118408203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,8,1,balanced,0.43380268414815265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,8,1,balanced,0.4349120060602824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,8,1,power_law_1.01,0.44330878257751466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,8,1,power_law_1.01,0.44357762336730955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,8,1,power_law_1.2,0.4480447769165039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,16384,2,8,8,1,power_law_1.2,0.44855680465698244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,1,balanced,3.063647905985514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,1,balanced,3.0715147654215493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,1,power_law_1.01,1.8869247436523438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,1,power_law_1.01,1.9086336135864257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,1,power_law_1.2,1.9783615112304687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,1,power_law_1.2,1.982111930847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,128,balanced,0.2076639930407206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,128,balanced,0.20805333058039346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,128,power_law_1.01,0.2448256015777588
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,128,power_law_1.01,0.2471679925918579
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,128,power_law_1.2,0.2616767883300781
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,128,power_law_1.2,0.2750272035598755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,16,balanced,0.2828213373819987
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,16,balanced,0.2871466676394145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,16,power_law_1.01,0.3427200078964233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,16,power_law_1.01,0.36455678939819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,16,power_law_1.2,0.3719935894012451
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,16,power_law_1.2,0.3870975971221924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,2,balanced,1.169157346089681
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,2,balanced,1.1747626463572185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,2,power_law_1.01,1.0959487915039063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,2,power_law_1.01,1.1049983978271485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,2,power_law_1.2,1.108505630493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,2,power_law_1.2,1.1414143562316894
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,256,balanced,0.20358399550120035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,256,balanced,0.20491733153661093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,256,power_law_1.01,0.22766079902648925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,256,power_law_1.01,0.22892160415649415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,256,power_law_1.2,0.25899519920349123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,256,power_law_1.2,0.25934720039367676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,32,balanced,0.24381866057713827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,32,balanced,0.2443466583887736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,32,power_law_1.01,0.3007744073867798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,32,power_law_1.01,0.306112003326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,32,power_law_1.2,0.32467200756073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,32,power_law_1.2,0.32527999877929686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,4,balanced,0.552127997080485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,4,balanced,0.5525813500086466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,4,power_law_1.01,0.608460807800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,4,power_law_1.01,0.6589568138122559
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,4,power_law_1.2,0.6993343830108643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,4,power_law_1.2,0.7578368186950684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,64,balanced,0.2178879976272583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,64,balanced,0.22005865971247354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,64,power_law_1.01,0.2528320074081421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,64,power_law_1.01,0.2572927951812744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,64,power_law_1.2,0.28062078952789304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,64,power_law_1.2,0.2870527982711792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,8,balanced,0.3731733163197835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,8,balanced,0.37481598059336346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,8,power_law_1.01,0.43462400436401366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,8,power_law_1.01,0.4457536220550537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,8,power_law_1.2,0.48142080307006835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,1,8,power_law_1.2,0.4924160003662109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,16,1,balanced,0.5535786549250284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,16,1,balanced,0.5538186629613241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,16,1,power_law_1.01,0.4918528079986572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,16,1,power_law_1.01,0.49331841468811033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,16,1,power_law_1.2,0.5036928176879882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,16,1,power_law_1.2,0.504697608947754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,2,1,balanced,1.6024692853291829
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,2,1,balanced,1.6133920351664226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,2,1,power_law_1.01,1.087615966796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,2,1,power_law_1.01,1.109670352935791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,2,1,power_law_1.2,1.1260736465454102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,2,1,power_law_1.2,1.1358336448669433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,32,1,balanced,0.5482826630274454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,32,1,balanced,0.5609600146611532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,32,1,power_law_1.01,0.5035071849822998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,32,1,power_law_1.01,0.5062655925750732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,32,1,power_law_1.2,0.517516803741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,32,1,power_law_1.2,0.5218111991882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,4,1,balanced,0.9769066969553629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,4,1,balanced,0.9782133102416992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,4,1,power_law_1.01,0.7200575828552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,4,1,power_law_1.01,0.7395328044891357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,4,1,power_law_1.2,0.7495935916900635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,4,1,power_law_1.2,0.7564223766326904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,8,1,balanced,0.6896853446960449
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,8,1,balanced,0.6924373308817545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,8,1,power_law_1.01,0.5587967872619629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,8,1,power_law_1.01,0.5623744010925293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,8,1,power_law_1.2,0.5778816223144532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2048,8,256,8,1,power_law_1.2,0.582860803604126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,1,balanced,2.8401705423990884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,1,balanced,2.850015958150228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,1,power_law_1.01,1.966182327270508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,1,power_law_1.01,1.9729856491088866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,1,power_law_1.2,1.9990079879760743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,1,power_law_1.2,2.0081600189208983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,16,balanced,0.2985066572825114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,16,balanced,0.2993493278821309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,16,power_law_1.01,0.3803136110305786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,16,power_law_1.01,0.409881591796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,16,power_law_1.2,0.4197567939758301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,16,power_law_1.2,0.4682432174682617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,2,balanced,1.1632213592529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,2,balanced,1.165285348892212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,2,power_law_1.01,1.1218175888061523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,2,power_law_1.01,1.141427230834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,2,power_law_1.2,1.2133952140808106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,2,power_law_1.2,1.2499584197998046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,32,balanced,0.2504799962043762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,32,balanced,0.2513226668039958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,32,power_law_1.01,0.3122495889663696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,32,power_law_1.01,0.3343744039535522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,32,power_law_1.2,0.36871039867401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,32,power_law_1.2,0.39076480865478513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,4,balanced,0.5869013468424479
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,4,balanced,0.589792013168335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,4,power_law_1.01,0.6784128189086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,4,power_law_1.01,0.7074624061584472
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,4,power_law_1.2,0.7548351764678956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,4,power_law_1.2,0.7755519866943359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,8,balanced,0.3917333285013835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,8,balanced,0.3924479881922404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,8,power_law_1.01,0.4788671970367432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,8,power_law_1.01,0.4871103763580322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,8,power_law_1.2,0.5301055908203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,1,8,power_law_1.2,0.5465343952178955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,2,1,balanced,1.5905067125956218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,2,1,balanced,1.5939040184020996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,2,1,power_law_1.01,1.14835844039917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,2,1,power_law_1.01,1.1552448272705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,2,1,power_law_1.2,1.1621376037597657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,2,1,power_law_1.2,1.1826111793518066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,4,1,balanced,0.9937333265940348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,4,1,balanced,0.9991253217061361
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,4,1,power_law_1.01,0.7580736160278321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,4,1,power_law_1.01,0.7580927848815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,4,1,power_law_1.2,0.7678271770477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,4,1,power_law_1.2,0.770470380783081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,8,1,balanced,0.7338879903157552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,8,1,balanced,0.7584053675333658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,8,1,power_law_1.01,0.6038591861724854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,8,1,power_law_1.01,0.6080063819885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,8,1,power_law_1.2,0.615065622329712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,6144,2560,8,160,8,1,power_law_1.2,0.6215424060821533
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,1,balanced,3.313536008199056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,1,balanced,3.472506523132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,1,power_law_1.01,2.220275115966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,1,power_law_1.01,2.226278305053711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,1,power_law_1.2,2.283238410949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,1,power_law_1.2,2.3416704177856444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,128,balanced,0.23610132932662964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,128,balanced,0.23640000820159912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,128,power_law_1.01,0.27425920963287354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,128,power_law_1.01,0.27596800327301024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,128,power_law_1.2,0.30312960147857665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,128,power_law_1.2,0.3187135934829712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,16,balanced,0.3227199912071228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,16,balanced,0.32737600803375244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,16,power_law_1.01,0.38431360721588137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,16,power_law_1.01,0.39232640266418456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,16,power_law_1.2,0.41804161071777346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,16,power_law_1.2,0.4210752010345459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,2,balanced,1.3005867004394531
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,2,balanced,1.3121973673502605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,2,power_law_1.01,1.2436160087585448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,2,power_law_1.01,1.2557760238647462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,2,power_law_1.2,1.2632960319519042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,2,power_law_1.2,1.30447359085083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,256,balanced,0.23221333821614584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,256,balanced,0.23302932580312094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,256,power_law_1.01,0.2586047887802124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,256,power_law_1.01,0.2607167959213257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,256,power_law_1.2,0.2897536039352417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,256,power_law_1.2,0.2960639953613281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,32,balanced,0.2762719988822937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,32,balanced,0.2769706646601359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,32,power_law_1.01,0.33388800621032716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,32,power_law_1.01,0.34403839111328127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,32,power_law_1.2,0.37455999851226807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,32,power_law_1.2,0.38185598850250246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,4,balanced,0.6393013397852579
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,4,balanced,0.6407466729482015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,4,power_law_1.01,0.7319744110107422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,4,power_law_1.01,0.7571392059326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,4,power_law_1.2,0.8126784324645996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,4,power_law_1.2,0.822713565826416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,64,balanced,0.25006399552027386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,64,balanced,0.25097066164016724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,64,power_law_1.01,0.29092481136322024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,64,power_law_1.01,0.2993664026260376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,64,power_law_1.2,0.33013119697570803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,64,power_law_1.2,0.3409087896347046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,8,balanced,0.4277333418528239
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,8,balanced,0.43004798889160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,8,power_law_1.01,0.5248703956604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,8,power_law_1.01,0.5262527942657471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,8,power_law_1.2,0.560262393951416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,1,8,power_law_1.2,0.5644735813140869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,16,1,balanced,0.6117493311564127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,16,1,balanced,0.627402663230896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,16,1,power_law_1.01,0.5645311832427978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,16,1,power_law_1.01,0.5678143978118897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,16,1,power_law_1.2,0.5752384185791015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,16,1,power_law_1.2,0.5778048038482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,2,1,balanced,1.7410133679707844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,2,1,balanced,1.8298452695210774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,2,1,power_law_1.01,1.260159969329834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,2,1,power_law_1.01,1.291539192199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,2,1,power_law_1.2,1.3156864166259765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,2,1,power_law_1.2,1.323481559753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,32,1,balanced,0.6151306629180908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,32,1,balanced,0.619210680325826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,32,1,power_law_1.01,0.5769472122192383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,32,1,power_law_1.01,0.576966381072998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,32,1,power_law_1.2,0.5886335849761963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,32,1,power_law_1.2,0.5991936206817627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,4,1,balanced,1.074064016342163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,4,1,balanced,1.0757013161977131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,4,1,power_law_1.01,0.8338879585266114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,4,1,power_law_1.01,0.839635181427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,4,1,power_law_1.2,0.8668352127075195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,4,1,power_law_1.2,0.8697024345397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,8,1,balanced,0.768234650293986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,8,1,balanced,0.7735573450724283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,8,1,power_law_1.01,0.6441855907440186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,8,1,power_law_1.01,0.6504384040832519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,8,1,power_law_1.2,0.661740779876709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,256,8,1,power_law_1.2,0.666374397277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,1,balanced,2.366005261739095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,1,balanced,2.3826346397399902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,1,power_law_1.01,2.753203201293945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,1,power_law_1.01,2.792518424987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,1,power_law_1.2,2.8920255661010743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,1,power_law_1.2,2.9266239166259767
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,128,balanced,0.23612266778945923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,128,balanced,0.2384373346964518
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,128,power_law_1.01,0.2694144010543823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,128,power_law_1.01,0.2768768072128296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,128,power_law_1.2,0.28687999248504636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,128,power_law_1.2,0.2876287937164307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,16,balanced,0.3290239969889323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,16,balanced,0.329365332921346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,16,power_law_1.01,0.39624319076538084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,16,power_law_1.01,0.4049856185913086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,16,power_law_1.2,0.44040961265563966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,16,power_law_1.2,0.45233922004699706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,2,balanced,1.0511306921641033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,2,balanced,1.0513546466827393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,2,power_law_1.01,1.4187392234802245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,2,power_law_1.01,1.4256319999694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,2,power_law_1.2,1.4854592323303222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,2,power_law_1.2,1.5673151969909669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,32,balanced,0.2767893274625142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,32,balanced,0.2773546576499939
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,32,power_law_1.01,0.32632319927215575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,32,power_law_1.01,0.3326911926269531
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,32,power_law_1.2,0.351910400390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,32,power_law_1.2,0.3640064001083374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,4,balanced,0.6283626556396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,4,balanced,0.6292746861775717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,4,power_law_1.01,0.8220928192138672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,4,power_law_1.01,0.8390399932861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,4,power_law_1.2,0.9080191612243652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,4,power_law_1.2,0.9308095932006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,64,balanced,0.2521973252296448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,64,balanced,0.25277332464853924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,64,power_law_1.01,0.28915839195251464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,64,power_law_1.01,0.2931328058242798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,64,power_law_1.2,0.32090880870819094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,64,power_law_1.2,0.3233151912689209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,8,balanced,0.4278453191121419
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,8,balanced,0.4280266761779785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,8,power_law_1.01,0.542790412902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,8,power_law_1.01,0.564467191696167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,8,power_law_1.2,0.5929984092712403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,1,8,power_law_1.2,0.593068790435791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,16,1,balanced,0.6382346550623575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,16,1,balanced,0.6778293450673422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,16,1,power_law_1.01,0.6905856132507324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,16,1,power_law_1.01,0.6955520153045655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,16,1,power_law_1.2,0.7050879955291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,16,1,power_law_1.2,0.706496000289917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,2,1,balanced,1.3598772684733074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,2,1,balanced,1.3749440511067708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,2,1,power_law_1.01,1.5707776069641113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,2,1,power_law_1.01,1.5740032196044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,2,1,power_law_1.2,1.6305343627929687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,2,1,power_law_1.2,1.6370431900024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,32,1,balanced,0.6549599965413412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,32,1,balanced,0.6552000045776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,32,1,power_law_1.01,0.7387519836425781
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,32,1,power_law_1.01,0.7558720111846924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,32,1,power_law_1.2,0.7441855907440186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,32,1,power_law_1.2,0.7568384170532226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,4,1,balanced,0.8720320065816244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,4,1,balanced,0.8737013339996338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,4,1,power_law_1.01,0.9726335525512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,4,1,power_law_1.01,0.9773695945739747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,4,1,power_law_1.2,1.0127039909362794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,4,1,power_law_1.2,1.0130880355834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,8,1,balanced,0.7010613282521566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,8,1,balanced,0.7859146595001221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,8,1,power_law_1.01,0.7687679767608643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,8,1,power_law_1.01,0.7716288089752197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,8,1,power_law_1.2,0.7899072170257568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,6144,7168,2048,8,384,8,1,power_law_1.2,0.7937535762786865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,1,balanced,0.08361066381136577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,1,balanced,0.0843946635723114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,1,power_law_1.01,0.07708799839019775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,1,power_law_1.01,0.07795199751853943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,1,power_law_1.2,0.07783039808273315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,1,power_law_1.2,0.07785599827766418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,128,balanced,0.03535466641187668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,128,balanced,0.03649600098530451
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,128,power_law_1.01,0.03332479894161224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,128,power_law_1.01,0.03480319976806641
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,128,power_law_1.2,0.03280639946460724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,128,power_law_1.2,0.03380480110645294
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,16,balanced,0.03329066683848699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,16,balanced,0.033573334415753685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,16,power_law_1.01,0.03049600124359131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,16,power_law_1.01,0.031097599864006044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,16,power_law_1.2,0.03155199885368347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,16,power_law_1.2,0.0315775990486145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,2,balanced,0.058543999989827476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,2,balanced,0.05899199843406677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,2,power_law_1.01,0.05573760271072388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,2,power_law_1.01,0.057107198238372806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,2,power_law_1.2,0.05644800066947937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,2,power_law_1.2,0.05787519812583923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,32,balanced,0.03275199979543686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,32,balanced,0.03335466732581457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,32,power_law_1.01,0.030483201146125793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,32,power_law_1.01,0.031148800253868104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,32,power_law_1.2,0.029388800263404846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,32,power_law_1.2,0.030451199412345885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,4,balanced,0.03691199918588003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,4,balanced,0.04061333338419596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,4,power_law_1.01,0.038553598523139956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,4,power_law_1.01,0.039443200826644896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,4,power_law_1.2,0.039001598954200745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,4,power_law_1.2,0.03922559916973114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,64,balanced,0.03533333291610082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,64,balanced,0.03751466671625773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,64,power_law_1.01,0.03356159925460815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,64,power_law_1.01,0.0350271999835968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,64,power_law_1.2,0.03379839956760407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,64,power_law_1.2,0.03456639945507049
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,8,balanced,0.03329066683848699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,8,balanced,0.03338133295377096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,8,power_law_1.01,0.030943998694419862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,8,power_law_1.01,0.031673601269721983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,8,power_law_1.2,0.03255679905414581
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,1,8,power_law_1.2,0.03294079899787903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,2,1,balanced,0.06014933188756307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,2,1,balanced,0.06214933097362518
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,2,1,power_law_1.01,0.05697280168533325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,2,1,power_law_1.01,0.05768960118293762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,2,1,power_law_1.2,0.056524801254272464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,2,1,power_law_1.2,0.05798400044441223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,4,1,balanced,0.04140799989302953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,4,1,balanced,0.043525333205858864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,4,1,power_law_1.01,0.0409280002117157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,4,1,power_law_1.01,0.04216960072517395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,4,1,power_law_1.2,0.042131200432777405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,2048,768,8,128,4,1,power_law_1.2,0.04275839924812317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,1,balanced,0.31218665838241577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,1,balanced,0.31350932518641156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,1,power_law_1.01,0.24391679763793944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,1,power_law_1.01,0.24496641159057617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,1,power_law_1.2,0.24213759899139403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,1,power_law_1.2,0.24296960830688477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,128,balanced,0.039408000806967415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,128,balanced,0.039834665755430855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,128,power_law_1.01,0.037939199805259706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,128,power_law_1.01,0.03813120126724243
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,128,power_law_1.2,0.03763839900493622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,128,power_law_1.2,0.037676799297332766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,16,balanced,0.051354666550954185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,16,balanced,0.051925331354141235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,16,power_law_1.01,0.046751999855041505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,16,power_law_1.01,0.04678399860858917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,16,power_law_1.2,0.04720639884471893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,16,power_law_1.2,0.04850560128688812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,2,balanced,0.17373865842819214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,2,balanced,0.1748746633529663
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,2,power_law_1.01,0.14634239673614502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,2,power_law_1.01,0.15073920488357545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,2,power_law_1.2,0.13804800510406495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,2,power_law_1.2,0.13991039991378784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,256,balanced,0.038160001238187156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,256,balanced,0.03923200070858002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,256,power_law_1.01,0.03585920035839081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,256,power_law_1.01,0.03682560026645661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,256,power_law_1.2,0.035795199871063235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,256,power_law_1.2,0.03621760010719299
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,32,balanced,0.03765333443880081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,32,balanced,0.037946666280428566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,32,power_law_1.01,0.034694400429725644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,32,power_law_1.01,0.035699200630187986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,32,power_law_1.2,0.03407360017299652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,32,power_law_1.2,0.035104000568389894
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,4,balanced,0.10488532980283101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,4,balanced,0.10579733053843181
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,4,power_law_1.01,0.08763520121574402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,4,power_law_1.01,0.09038720130920411
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,4,power_law_1.2,0.09351680278778077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,4,power_law_1.2,0.0961408019065857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,64,balanced,0.034160000582536064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,64,balanced,0.035461333890755974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,64,power_law_1.01,0.03285120129585266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,64,power_law_1.01,0.03457919955253601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,64,power_law_1.2,0.03322240114212036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,64,power_law_1.2,0.03372800052165985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,8,balanced,0.07036266724268596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,8,balanced,0.07038400073846181
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,8,power_law_1.01,0.061484801769256595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,8,power_law_1.01,0.06449919939041138
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,8,power_law_1.2,0.060096001625061034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,1,8,power_law_1.2,0.0648959994316101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,2,1,balanced,0.17754666010538736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,2,1,balanced,0.17760000626246134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,2,1,power_law_1.01,0.14264320135116576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,2,1,power_law_1.01,0.14288640022277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,2,1,power_law_1.2,0.13972480297088624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,2,1,power_law_1.2,0.1412160038948059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,4,1,balanced,0.10920533537864685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,4,1,balanced,0.11012799541155498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,4,1,power_law_1.01,0.09015039801597595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,4,1,power_law_1.01,0.09147520065307617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,4,1,power_law_1.2,0.0874176025390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,4,1,power_law_1.2,0.0912447988986969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,8,1,balanced,0.08276266853014629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,8,1,balanced,0.0842026670773824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,8,1,power_law_1.01,0.06974080204963684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,8,1,power_law_1.01,0.07020800113677979
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,8,1,power_law_1.2,0.06934400200843811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,3072,1536,8,256,8,1,power_law_1.2,0.07007359862327575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,1,balanced,0.17647467056910196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,1,balanced,0.17670400937398276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,1,power_law_1.01,0.1934592008590698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,1,power_law_1.01,0.1945855975151062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,1,power_law_1.2,0.1966912031173706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,1,power_law_1.2,0.19782400131225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,2,balanced,0.08725866675376892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,2,balanced,0.08912000060081482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,2,power_law_1.01,0.10028159618377686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,2,power_law_1.01,0.1028480052947998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,2,power_law_1.2,0.10229760408401489
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,2,power_law_1.2,0.10528639554977418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,4,balanced,0.06492266555627187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,4,balanced,0.06691733499368031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,4,power_law_1.01,0.06844159960746765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,4,power_law_1.01,0.06863359808921814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,4,power_law_1.2,0.06700159907341004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,4,power_law_1.2,0.06812160015106201
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,8,balanced,0.05628266433874766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,8,balanced,0.056320001681645714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,8,power_law_1.01,0.05248000025749207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,8,power_law_1.01,0.05452160239219665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,8,power_law_1.2,0.053376001119613645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,1,8,power_law_1.2,0.05482239723205566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,16,1,balanced,0.03368533402681351
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,16,1,balanced,0.03369600077470144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,16,1,power_law_1.01,0.03371520042419433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,16,1,power_law_1.01,0.03454079926013946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,16,1,power_law_1.2,0.03338879942893982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,16,1,power_law_1.2,0.03346560001373291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,2,1,balanced,0.09697600205739339
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,2,1,balanced,0.09876799583435059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,2,1,power_law_1.01,0.10899840593338013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,2,1,power_law_1.01,0.10945279598236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,2,1,power_law_1.2,0.10880000591278076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,2,1,power_law_1.2,0.11020159721374512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,32,1,balanced,0.029466666281223297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,32,1,balanced,0.031248000760873158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,32,1,power_law_1.01,0.02956799864768982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,32,1,power_law_1.01,0.03048959970474243
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,32,1,power_law_1.2,0.029529601335525513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,32,1,power_law_1.2,0.030553600192070006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,4,1,balanced,0.06407466530799866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,4,1,balanced,0.06775466601053874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,4,1,power_law_1.01,0.06878079771995545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,4,1,power_law_1.01,0.06885120272636414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,4,1,power_law_1.2,0.06775680184364319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,4,1,power_law_1.2,0.06778879761695862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,8,1,balanced,0.047877331574757896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,8,1,balanced,0.04788800080617269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,8,1,power_law_1.01,0.0480320006608963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,8,1,power_law_1.01,0.04874880015850067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,8,1,power_law_1.2,0.04712960124015808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,14336,2,8,8,1,power_law_1.2,0.047884801030159
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,1,balanced,0.22205867369969687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,1,balanced,0.2223893404006958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,1,power_law_1.01,0.20289280414581298
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,1,power_law_1.01,0.20583040714263917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,1,power_law_1.2,0.20585598945617675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,1,power_law_1.2,0.20635519027709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,128,balanced,0.03966933240493139
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,128,balanced,0.0401706670721372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,128,power_law_1.01,0.03868800103664398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,128,power_law_1.01,0.03885439932346344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,128,power_law_1.2,0.0377344012260437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,128,power_law_1.2,0.03852159976959228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,16,balanced,0.0394400010506312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,16,balanced,0.03977599988381068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,16,power_law_1.01,0.039961600303649904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,16,power_law_1.01,0.04051840007305145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,16,power_law_1.2,0.04097279906272888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,16,power_law_1.2,0.04139519929885864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,2,balanced,0.1285546620686849
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,2,balanced,0.12957866986592612
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,2,power_law_1.01,0.12011519670486451
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,2,power_law_1.01,0.12086399793624877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,2,power_law_1.2,0.12250239849090576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,2,power_law_1.2,0.12307840585708618
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,32,balanced,0.035786665976047516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,32,balanced,0.03585066646337509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,32,power_law_1.01,0.034220799803733826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,32,power_law_1.01,0.0344895988702774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,32,power_law_1.2,0.03423359990119934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,32,power_law_1.2,0.0345984011888504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,4,balanced,0.08193600177764893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,4,balanced,0.08230933547019958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,4,power_law_1.01,0.07669119834899903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,4,power_law_1.01,0.07811840176582337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,4,power_law_1.2,0.07806079983711242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,4,power_law_1.2,0.08075519800186157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,64,balanced,0.04178666571776072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,64,balanced,0.04215466479460398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,64,power_law_1.01,0.03887999951839447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,64,power_law_1.01,0.04048640131950378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,64,power_law_1.2,0.04023680090904236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,64,power_law_1.2,0.04030719995498657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,8,balanced,0.058261334896087646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,8,balanced,0.05949866771697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,8,power_law_1.01,0.05505920052528381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,8,power_law_1.01,0.055615997314453124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,8,power_law_1.2,0.05613440275192261
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,1,8,power_law_1.2,0.0562175989151001
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,2,1,balanced,0.1320746640364329
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,2,1,balanced,0.13235200444857279
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,2,1,power_law_1.01,0.12067199945449829
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,2,1,power_law_1.01,0.12378239631652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,2,1,power_law_1.2,0.12314879894256592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,2,1,power_law_1.2,0.12658560276031494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,4,1,balanced,0.08674133817354839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,4,1,balanced,0.08685333530108134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,4,1,power_law_1.01,0.08140159845352173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,4,1,power_law_1.01,0.0816703975200653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,4,1,power_law_1.2,0.08075519800186157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,4,1,power_law_1.2,0.0839743971824646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,8,1,balanced,0.06613333523273468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,8,1,balanced,0.0676693320274353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,8,1,power_law_1.01,0.06362879872322083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,8,1,power_law_1.01,0.06421120166778564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,8,1,power_law_1.2,0.06376320123672485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,4096,1536,8,128,8,1,power_law_1.2,0.06437119841575623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,1,balanced,0.3588586648305257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,1,balanced,0.35939733187357586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,1,power_law_1.01,0.413862419128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,1,power_law_1.01,0.42407679557800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,1,power_law_1.2,0.39866878986358645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,1,power_law_1.2,0.4123392105102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,2,balanced,0.1291253368059794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,2,balanced,0.13224533200263977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,2,power_law_1.01,0.17407360076904296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,2,power_law_1.01,0.18142080307006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,2,power_law_1.2,0.18157440423965454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,2,power_law_1.2,0.1815999984741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,4,balanced,0.08499733606974284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,4,balanced,0.08504533767700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,4,power_law_1.01,0.09719679951667785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,4,power_law_1.01,0.10199040174484253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,4,power_law_1.2,0.09839360117912292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,4,power_law_1.2,0.09902719855308532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,8,balanced,0.08692800005276997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,8,balanced,0.08771199981371562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,8,power_law_1.01,0.0659712016582489
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,8,power_law_1.01,0.06996480226516724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,8,power_law_1.2,0.06639360189437866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,1,8,power_law_1.2,0.06645119786262513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,16,1,balanced,0.04365866879622141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,16,1,balanced,0.04472533365090688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,16,1,power_law_1.01,0.04467839896678925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,16,1,power_law_1.01,0.04528000056743622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,16,1,power_law_1.2,0.045126399397850035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,16,1,power_law_1.2,0.045151999592781066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,2,1,balanced,0.14612799882888794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,2,1,balanced,0.14686933159828186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,2,1,power_law_1.01,0.16751359701156615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,2,1,power_law_1.01,0.16980479955673217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,2,1,power_law_1.2,0.16690560579299926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,2,1,power_law_1.2,0.17222399711608888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,32,1,balanced,0.03323200096686681
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,32,1,balanced,0.03365866591533025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,32,1,power_law_1.01,0.034431999921798705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,32,1,power_law_1.01,0.03478400111198425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,32,1,power_law_1.2,0.03356159925460815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,32,1,power_law_1.2,0.033817601203918454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,4,1,balanced,0.0916266640027364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,4,1,balanced,0.09388800462086995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,4,1,power_law_1.01,0.09589120149612426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,4,1,power_law_1.01,0.10121599435806275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,4,1,power_law_1.2,0.09621120095252991
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,4,1,power_law_1.2,0.09739519953727722
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,8,1,balanced,0.062133332093556724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,8,1,balanced,0.062309334675470986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,8,1,power_law_1.01,0.06277120113372803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,8,1,power_law_1.01,0.0634112000465393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,8,1,power_law_1.2,0.06282879710197449
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,16384,2,8,8,1,power_law_1.2,0.06403840184211732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,1,balanced,0.7812053362528483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,1,balanced,0.781440019607544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,1,power_law_1.01,0.6048255920410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,1,power_law_1.01,0.6132800102233886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,1,power_law_1.2,0.5837056159973144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,1,power_law_1.2,0.5912511825561524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,128,balanced,0.07672533392906189
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,128,balanced,0.0787360022465388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,128,power_law_1.01,0.07389439940452576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,128,power_law_1.01,0.07488639950752259
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,128,power_law_1.2,0.07341439723968506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,128,power_law_1.2,0.07557759881019592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,16,balanced,0.08449066678682964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,16,balanced,0.08502399921417236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,16,power_law_1.01,0.07336320281028748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,16,power_law_1.01,0.07799680233001709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,16,power_law_1.2,0.07747840285301208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,16,power_law_1.2,0.07967360019683838
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,2,balanced,0.40748266379038495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,2,balanced,0.41124268372853595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,2,power_law_1.01,0.3156928062438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,2,power_law_1.01,0.32769920825958254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,2,power_law_1.2,0.3122688055038452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,2,power_law_1.2,0.32902400493621825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,256,balanced,0.05826666454474131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,256,balanced,0.05827199916044871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,256,power_law_1.01,0.05440639853477478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,256,power_law_1.01,0.05735679864883423
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,256,power_law_1.2,0.054451197385787964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,256,power_law_1.2,0.05475839972496033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,32,balanced,0.059749335050582886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,32,balanced,0.06113066772619883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,32,power_law_1.01,0.058259201049804685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,32,power_law_1.01,0.061401599645614625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,32,power_law_1.2,0.05912320017814636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,32,power_law_1.2,0.05948160290718078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,4,balanced,0.22375466426213583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,4,balanced,0.22509332497914633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,4,power_law_1.01,0.19443199634552003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,4,power_law_1.01,0.1994879961013794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,4,power_law_1.2,0.17181440591812133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,4,power_law_1.2,0.19196799993515015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,64,balanced,0.05932266513506571
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,64,balanced,0.06060799956321716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,64,power_law_1.01,0.055980801582336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,64,power_law_1.01,0.05761920213699341
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,64,power_law_1.2,0.05262719988822937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,64,power_law_1.2,0.05556480288505554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,8,balanced,0.1321333348751068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,8,balanced,0.1334826648235321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,8,power_law_1.01,0.11399040222167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,8,power_law_1.01,0.12097920179367065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,8,power_law_1.2,0.11103359460830689
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,1,8,power_law_1.2,0.11895040273666382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,16,1,balanced,0.10883733630180359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,16,1,balanced,0.10935999949773152
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,16,1,power_law_1.01,0.09086719751358033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,16,1,power_law_1.01,0.091839998960495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,16,1,power_law_1.2,0.09136000275611877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,16,1,power_law_1.2,0.09196799993515015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,2,1,balanced,0.4107733170191447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,2,1,balanced,0.4117279847462972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,2,1,power_law_1.01,0.31038079261779783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,2,1,power_law_1.01,0.3178623914718628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,2,1,power_law_1.2,0.3103424072265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,2,1,power_law_1.2,0.3164736032485962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,32,1,balanced,0.09166399637858073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,32,1,balanced,0.09222933650016785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,32,1,power_law_1.01,0.07888640165328979
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,32,1,power_law_1.01,0.07935360074043274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,32,1,power_law_1.2,0.0790336012840271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,32,1,power_law_1.2,0.0791487991809845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,4,1,balanced,0.22827200094858804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,4,1,balanced,0.2283680041631063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,4,1,power_law_1.01,0.17994240522384644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,4,1,power_law_1.01,0.1813696026802063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,4,1,power_law_1.2,0.17626240253448486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,4,1,power_law_1.2,0.17696640491485596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,8,1,balanced,0.14225600163141885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,8,1,balanced,0.14249599973360697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,8,1,power_law_1.01,0.11743999719619751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,8,1,power_law_1.01,0.11783039569854736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,8,1,power_law_1.2,0.1185215950012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2048,8,256,8,1,power_law_1.2,0.11857279539108276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,1,balanced,0.6185386578241984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,1,balanced,0.6209439833958944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,1,power_law_1.01,0.529753589630127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,1,power_law_1.01,0.5360896110534668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,1,power_law_1.2,0.5287231922149658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,1,power_law_1.2,0.5406015872955322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,16,balanced,0.07531733314196269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,16,balanced,0.07653333246707916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,16,power_law_1.01,0.07226240038871765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,16,power_law_1.01,0.07279999852180481
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,16,power_law_1.2,0.0719488024711609
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,16,power_law_1.2,0.07274879813194275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,2,balanced,0.32876267035802204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,2,balanced,0.3293493390083313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,2,power_law_1.01,0.2947200059890747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,2,power_law_1.01,0.29684479236602784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,2,power_law_1.2,0.2832256078720093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,2,power_law_1.2,0.2938175916671753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,32,balanced,0.08053333560625713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,32,balanced,0.0816480020682017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,32,power_law_1.01,0.07461760044097901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,32,power_law_1.01,0.07509120106697083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,32,power_law_1.2,0.06682239770889283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,32,power_law_1.2,0.07015680074691773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,4,balanced,0.1836479902267456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,4,balanced,0.18385066588719687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,4,power_law_1.01,0.159552001953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,4,power_law_1.01,0.17062400579452514
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,4,power_law_1.2,0.16764160394668579
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,4,power_law_1.2,0.17505919933319092
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,8,balanced,0.11197333534558614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,8,balanced,0.11276266972223918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,8,power_law_1.01,0.10103679895401001
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,8,power_law_1.01,0.10502400398254394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,8,power_law_1.2,0.10093439817428589
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,1,8,power_law_1.2,0.10546560287475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,2,1,balanced,0.3327839970588684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,2,1,balanced,0.33345067501068115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,2,1,power_law_1.01,0.28608639240264894
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,2,1,power_law_1.01,0.2940160036087036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,2,1,power_law_1.2,0.2923775911331177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,2,1,power_law_1.2,0.2963583946228027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,4,1,balanced,0.19356266657511392
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,4,1,balanced,0.19395732879638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,4,1,power_law_1.01,0.17070080041885377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,4,1,power_law_1.01,0.1724992036819458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,4,1,power_law_1.2,0.17169920206069947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,4,1,power_law_1.2,0.17626880407333373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,8,1,balanced,0.11803199847539265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,8,1,balanced,0.11946133772532146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,8,1,power_law_1.01,0.1082111954689026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,8,1,power_law_1.01,0.1098431944847107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,8,1,power_law_1.2,0.108787202835083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,6144,2560,8,160,8,1,power_law_1.2,0.10945279598236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,1,balanced,0.9060479799906412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,1,balanced,0.9068373044331869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,1,power_law_1.01,0.6926527976989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,1,power_law_1.01,0.693120002746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,1,power_law_1.2,0.679859209060669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,1,power_law_1.2,0.682809591293335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,128,balanced,0.05208533505598704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,128,balanced,0.053957333167394005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,128,power_law_1.01,0.049932798743247984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,128,power_law_1.01,0.050758397579193114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,128,power_law_1.2,0.04963839948177338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,128,power_law_1.2,0.05087360143661499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,16,balanced,0.09286399682362874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,16,balanced,0.09514133135477702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,16,power_law_1.01,0.08247680068016053
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,16,power_law_1.01,0.08680319786071777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,16,power_law_1.2,0.08715519905090333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,16,power_law_1.2,0.08725119829177856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,2,balanced,0.47141865889231366
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,2,balanced,0.47375468413035077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,2,power_law_1.01,0.384716796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,2,power_law_1.01,0.3919615983963013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,2,power_law_1.2,0.3871680021286011
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,2,power_law_1.2,0.4001920223236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,256,balanced,0.044677332043647766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,256,balanced,0.04589866598447164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,256,power_law_1.01,0.04361599981784821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,256,power_law_1.01,0.04444159865379334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,256,power_law_1.2,0.04304639995098114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,256,power_law_1.2,0.0448063999414444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,32,balanced,0.06565333406130473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,32,balanced,0.06589333216349284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,32,power_law_1.01,0.06280959844589233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,32,power_law_1.01,0.06321920156478882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,32,power_law_1.2,0.06088320016860962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,32,power_law_1.2,0.06339840292930603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,4,balanced,0.25575466950734455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,4,balanced,0.2571840087572734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,4,power_law_1.01,0.22081279754638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,4,power_law_1.01,0.23296639919281006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,4,power_law_1.2,0.2114176034927368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,4,power_law_1.2,0.22639360427856445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,64,balanced,0.054058666030565895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,64,balanced,0.05497066676616669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,64,power_law_1.01,0.05203199982643127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,64,power_law_1.01,0.052748799324035645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,64,power_law_1.2,0.048153600096702574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,64,power_law_1.2,0.049491199851036075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,8,balanced,0.14789332946141562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,8,balanced,0.14921599626541138
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,8,power_law_1.01,0.13242239952087403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,8,power_law_1.01,0.13549439907073973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,8,power_law_1.2,0.12138240337371826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,1,8,power_law_1.2,0.12823679447174072
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,16,1,balanced,0.12152533729871114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,16,1,balanced,0.12268267075220744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,16,1,power_law_1.01,0.10221439599990845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,16,1,power_law_1.01,0.10323840379714966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,16,1,power_law_1.2,0.10140800476074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,16,1,power_law_1.2,0.10303360223770142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,2,1,balanced,0.4724586804707845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,2,1,balanced,0.47654934724171955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,2,1,power_law_1.01,0.3647615909576416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,2,1,power_law_1.01,0.36620800495147704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,2,1,power_law_1.2,0.35829761028289797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,2,1,power_law_1.2,0.35936000347137453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,32,1,balanced,0.10260799527168274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,32,1,balanced,0.1032373309135437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,32,1,power_law_1.01,0.0869055986404419
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,32,1,power_law_1.01,0.08892800211906433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,32,1,power_law_1.2,0.0886784017086029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,32,1,power_law_1.2,0.0899071991443634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,4,1,balanced,0.2603093385696411
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,4,1,balanced,0.26043200492858887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,4,1,power_law_1.01,0.20861439704895018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,4,1,power_law_1.01,0.21001598834991456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,4,1,power_law_1.2,0.2044287919998169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,4,1,power_law_1.2,0.20589439868927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,8,1,balanced,0.16085333625475565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,8,1,balanced,0.1623093287150065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,8,1,power_law_1.01,0.13189760446548462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,8,1,power_law_1.01,0.1331264019012451
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,8,1,power_law_1.2,0.12905600070953369
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,256,8,1,power_law_1.2,0.1339840054512024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,1,balanced,1.3325973351796467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,1,balanced,1.3330453236897786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,1,power_law_1.01,0.8967552185058594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,1,power_law_1.01,0.9015744209289551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,1,power_law_1.2,0.868006420135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,1,power_law_1.2,0.8709376335144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,128,balanced,0.060175999999046326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,128,balanced,0.06228266656398773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,128,power_law_1.01,0.05734400153160095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,128,power_law_1.01,0.05975040197372437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,128,power_law_1.2,0.05875840187072754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,128,power_law_1.2,0.058815997838973996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,16,balanced,0.12282666563987732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,16,balanced,0.12291199962298076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,16,power_law_1.01,0.10367360115051269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,16,power_law_1.01,0.1094655990600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,16,power_law_1.2,0.10549759864807129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,16,power_law_1.2,0.1089087963104248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,2,balanced,0.6840799649556478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,2,balanced,0.6860799789428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,2,power_law_1.01,0.5144000053405762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,2,power_law_1.01,0.5214911937713623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,2,power_law_1.2,0.49147520065307615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,2,power_law_1.2,0.51146240234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,32,balanced,0.08030933141708374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,32,balanced,0.08220799763997395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,32,power_law_1.01,0.07249280214309692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,32,power_law_1.01,0.07578880190849305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,32,power_law_1.2,0.06969599723815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,32,power_law_1.2,0.07487360239028931
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,4,balanced,0.3608959913253784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,4,balanced,0.3630613485972087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,4,power_law_1.01,0.2823744058609009
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,4,power_law_1.01,0.3031552076339722
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,4,power_law_1.2,0.3054975986480713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,4,power_law_1.2,0.3277184009552002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,64,balanced,0.06674133241176605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,64,balanced,0.06824000179767609
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,64,power_law_1.01,0.0636031985282898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,64,power_law_1.01,0.06451839804649354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,64,power_law_1.2,0.05554559826850891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,64,power_law_1.2,0.06453120112419128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,8,balanced,0.20204800367355347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,8,balanced,0.20295999447504678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,8,power_law_1.01,0.16465920209884644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,8,power_law_1.01,0.17034239768981935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,8,power_law_1.2,0.17704319953918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,1,8,power_law_1.2,0.18934400081634523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,16,1,balanced,0.16116266449292502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,16,1,balanced,0.16245333353678384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,16,1,power_law_1.01,0.12442879676818848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,16,1,power_law_1.01,0.12595200538635254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,16,1,power_law_1.2,0.12291200160980224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,16,1,power_law_1.2,0.12390400171279907
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,2,1,balanced,0.6863946914672852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,2,1,balanced,0.6878399848937988
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,2,1,power_law_1.01,0.47091197967529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,2,1,power_law_1.01,0.4774911880493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,2,1,power_law_1.2,0.45518717765808103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,2,1,power_law_1.2,0.45866241455078127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,32,1,balanced,0.1337440013885498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,32,1,balanced,0.1346560021241506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,32,1,power_law_1.01,0.10406399965286255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,32,1,power_law_1.01,0.1040768027305603
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,32,1,power_law_1.2,0.10207359790802002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,32,1,power_law_1.2,0.10454399585723877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,4,1,balanced,0.3661493460337321
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,4,1,balanced,0.3693813482920329
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,4,1,power_law_1.01,0.25852160453796386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,4,1,power_law_1.01,0.2606015920639038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,4,1,power_law_1.2,0.25397119522094724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,4,1,power_law_1.2,0.25474560260772705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,8,1,balanced,0.21870400508244833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,8,1,balanced,0.220634659131368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,8,1,power_law_1.01,0.16352640390396117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,8,1,power_law_1.01,0.16407040357589722
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,8,1,power_law_1.2,0.15932799577713014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,64,7168,2048,8,384,8,1,power_law_1.2,0.16053760051727295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,1,balanced,0.1122773289680481
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,1,balanced,0.11339199542999268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,1,power_law_1.01,0.11482239961624145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,1,power_law_1.01,0.11638400554656983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,1,power_law_1.2,0.11689599752426147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,1,power_law_1.2,0.1184000015258789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,128,balanced,0.04050666590531667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,128,balanced,0.04128533353408178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,128,power_law_1.01,0.03992320001125336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,128,power_law_1.01,0.04017280042171478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,128,power_law_1.2,0.03920640051364899
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,128,power_law_1.2,0.03961600065231323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,16,balanced,0.04186666508515676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,16,balanced,0.04204266766707102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,16,power_law_1.01,0.04203520119190216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,16,power_law_1.01,0.042822399735450746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,16,power_law_1.2,0.043584001064300534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,16,power_law_1.2,0.04467839896678925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,2,balanced,0.07201066613197327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,2,balanced,0.07248533268769582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,2,power_law_1.01,0.07517439723014832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,2,power_law_1.01,0.07991039752960205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,2,power_law_1.2,0.07869439721107482
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,2,power_law_1.2,0.07959679961204529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,32,balanced,0.04186666508515676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,32,balanced,0.04188799858093262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,32,power_law_1.01,0.04066559970378876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,32,power_law_1.01,0.04147840142250061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,32,power_law_1.2,0.04073599874973297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,32,power_law_1.2,0.04108799993991852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,4,balanced,0.07657599945863088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,4,balanced,0.0792799989382426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,4,power_law_1.01,0.07151359915733338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,4,power_law_1.01,0.07240960001945496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,4,power_law_1.2,0.0730239987373352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,4,power_law_1.2,0.07831680178642272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,64,balanced,0.040778666734695435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,64,balanced,0.04167999823888143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,64,power_law_1.01,0.04017919898033142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,64,power_law_1.01,0.040550398826599124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,64,power_law_1.2,0.03978239893913269
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,64,power_law_1.2,0.0403328001499176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,8,balanced,0.049135997891426086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,8,balanced,0.049600000182787575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,8,power_law_1.01,0.05103999972343445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,8,power_law_1.01,0.051481598615646364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,8,power_law_1.2,0.0530239999294281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,1,8,power_law_1.2,0.05319679975509643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,2,1,balanced,0.08422933022181193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,2,1,balanced,0.08473066488901775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,2,1,power_law_1.01,0.08440960049629212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,2,1,power_law_1.01,0.0850048005580902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,2,1,power_law_1.2,0.08488960266113281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,2,1,power_law_1.2,0.08592000007629394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,4,1,balanced,0.06811200082302094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,4,1,balanced,0.0697813332080841
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,4,1,power_law_1.01,0.06815360188484192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,4,1,power_law_1.01,0.06903039813041686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,4,1,power_law_1.2,0.0695039987564087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,2048,768,8,128,4,1,power_law_1.2,0.07009279727935791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,1,balanced,0.3717600107192993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,1,balanced,0.37269333998362225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,1,power_law_1.01,0.38302719593048096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,1,power_law_1.01,0.3895103931427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,1,power_law_1.2,0.39479680061340333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,1,power_law_1.2,0.4010176181793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,128,balanced,0.04558933277924856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,128,balanced,0.045696000258127846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,128,power_law_1.01,0.04455040097236633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,128,power_law_1.01,0.044710400700569156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,128,power_law_1.2,0.04451839923858643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,128,power_law_1.2,0.045132800936698914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,16,balanced,0.06942933301130931
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,16,balanced,0.07035199801127116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,16,power_law_1.01,0.06766080260276794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,16,power_law_1.01,0.07008000016212464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,16,power_law_1.2,0.06941440105438232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,16,power_law_1.2,0.0710591971874237
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,2,balanced,0.19086933135986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,2,balanced,0.19151999553044638
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,2,power_law_1.01,0.19523839950561522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,2,power_law_1.01,0.1953279972076416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,2,power_law_1.2,0.20373759269714356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,2,power_law_1.2,0.2052608013153076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,256,balanced,0.04602666695912679
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,256,balanced,0.046069333950678505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,256,power_law_1.01,0.043993601202964784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,256,power_law_1.01,0.044377601146698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,256,power_law_1.2,0.04392960071563721
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,256,power_law_1.2,0.04398080110549927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,32,balanced,0.05388266841570536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,32,balanced,0.054010664423306785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,32,power_law_1.01,0.05433599948883057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,32,power_law_1.01,0.05494400262832642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,32,power_law_1.2,0.055257600545883176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,32,power_law_1.2,0.05598719716072083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,4,balanced,0.14040533701578775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,4,balanced,0.14114666978518167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,4,power_law_1.01,0.11893759965896607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,4,power_law_1.01,0.12052479982376099
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,4,power_law_1.2,0.12416640520095826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,4,power_law_1.2,0.13248640298843384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,64,balanced,0.04700266818205515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,64,balanced,0.04758933186531067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,64,power_law_1.01,0.046963199973106384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,64,power_law_1.01,0.04696959853172302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,64,power_law_1.2,0.047539201378822324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,64,power_law_1.2,0.048153600096702574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,8,balanced,0.1622880001862844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,8,balanced,0.16897600889205933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,8,power_law_1.01,0.1141759991645813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,8,power_law_1.01,0.1211967945098877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,8,power_law_1.2,0.1155519962310791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,1,8,power_law_1.2,0.11758079528808593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,2,1,balanced,0.23004267613093057
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,2,1,balanced,0.23057599862416586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,2,1,power_law_1.01,0.23066239356994628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,2,1,power_law_1.01,0.2340928077697754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,2,1,power_law_1.2,0.23905279636383056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,2,1,power_law_1.2,0.24175360202789306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,4,1,balanced,0.1523253321647644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,4,1,balanced,0.15242133537928262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,4,1,power_law_1.01,0.14755200147628783
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,4,1,power_law_1.01,0.1484544038772583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,4,1,power_law_1.2,0.1523200035095215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,4,1,power_law_1.2,0.15327999591827393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,8,1,balanced,0.12139200170834859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,8,1,balanced,0.12200533350308736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,8,1,power_law_1.01,0.11697920560836791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,8,1,power_law_1.01,0.1185215950012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,8,1,power_law_1.2,0.12010879516601562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,3072,1536,8,256,8,1,power_law_1.2,0.12082560062408447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,1,balanced,0.5957226753234863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,1,balanced,0.5967199802398682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,1,power_law_1.01,0.2987391948699951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,1,power_law_1.01,0.30782721042633054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,1,power_law_1.2,0.3000447988510132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,1,power_law_1.2,0.306931209564209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,2,balanced,0.2700960040092468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,2,balanced,0.2704266707102458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,2,power_law_1.01,0.19720959663391113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,2,power_law_1.01,0.24099841117858886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,2,power_law_1.2,0.1993600010871887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,2,power_law_1.2,0.21011838912963868
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,4,balanced,0.10609066486358643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,4,balanced,0.1076639990011851
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,4,power_law_1.01,0.15649280548095704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,4,power_law_1.01,0.1606528043746948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,4,power_law_1.2,0.14375679492950438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,4,power_law_1.2,0.15771520137786865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,8,balanced,0.08576533198356628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,8,balanced,0.08708266417185466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,8,power_law_1.01,0.11984000205993653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,8,power_law_1.01,0.1282688021659851
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,8,power_law_1.2,0.12632319927215577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,1,8,power_law_1.2,0.12762880325317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,16,1,balanced,0.08084799846013387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,16,1,balanced,0.0820000022649765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,16,1,power_law_1.01,0.06160640120506287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,16,1,power_law_1.01,0.062431997060775755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,16,1,power_law_1.2,0.0586624026298523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,16,1,power_law_1.2,0.059680002927780154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,2,1,balanced,0.3201333284378052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,2,1,balanced,0.3263733386993408
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,2,1,power_law_1.01,0.16891520023345946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,2,1,power_law_1.01,0.2143359899520874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,2,1,power_law_1.2,0.16320639848709106
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,2,1,power_law_1.2,0.17616000175476074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,32,1,balanced,0.056090667843818665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,32,1,balanced,0.060047999024391174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,32,1,power_law_1.01,0.05125759840011597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,32,1,power_law_1.01,0.052985602617263795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,32,1,power_law_1.2,0.05115519762039185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,32,1,power_law_1.2,0.051744002103805545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,4,1,balanced,0.1846346656481425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,4,1,balanced,0.1904159982999166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,4,1,power_law_1.01,0.11303039789199829
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,4,1,power_law_1.01,0.11392639875411988
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,4,1,power_law_1.2,0.10560640096664428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,4,1,power_law_1.2,0.10562560558319092
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,8,1,balanced,0.1144480009873708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,8,1,balanced,0.11987200379371643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,8,1,power_law_1.01,0.077920001745224
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,8,1,power_law_1.01,0.07930240035057068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,8,1,power_law_1.2,0.07793279886245727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,14336,2,8,8,1,power_law_1.2,0.08433279991149903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,1,balanced,0.29949865738550824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,1,balanced,0.3001439968744914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,1,power_law_1.01,0.3153984069824219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,1,power_law_1.01,0.3173952102661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,1,power_law_1.2,0.32522239685058596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,1,power_law_1.2,0.3321280002593994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,128,balanced,0.04911466439565023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,128,balanced,0.04922133187452952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,128,power_law_1.01,0.04850560128688812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,128,power_law_1.01,0.048518401384353635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,128,power_law_1.2,0.048895999789237976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,128,power_law_1.2,0.04989440143108368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,16,balanced,0.0643093337615331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,16,balanced,0.06507733464241028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,16,power_law_1.01,0.06615039706230164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,16,power_law_1.01,0.06720640063285828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,16,power_law_1.2,0.06969599723815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,16,power_law_1.2,0.07067520022392274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,2,balanced,0.1569813291231791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,2,balanced,0.15717333555221558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,2,power_law_1.01,0.1667904019355774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,2,power_law_1.01,0.17445759773254393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,2,power_law_1.2,0.17541760206222534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,2,power_law_1.2,0.178656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,32,balanced,0.04984533290068308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,32,balanced,0.0499946673711141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,32,power_law_1.01,0.0561024010181427
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,32,power_law_1.01,0.05991680026054382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,32,power_law_1.2,0.057107198238372806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,32,power_law_1.2,0.05738239884376526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,4,balanced,0.18000533183415732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,4,balanced,0.1882773240407308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,4,power_law_1.01,0.13808640241622924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,4,power_law_1.01,0.17434240579605104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,4,power_law_1.2,0.13411200046539307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,4,power_law_1.2,0.141702401638031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,64,balanced,0.04794666667779287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,64,balanced,0.04906666775544485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,64,power_law_1.01,0.048537600040435794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,64,power_law_1.01,0.05023999810218811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,64,power_law_1.2,0.05077760219573975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,64,power_law_1.2,0.05161600112915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,8,balanced,0.08241599798202515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,8,balanced,0.08295999964078267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,8,power_law_1.01,0.08549759984016418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,8,power_law_1.01,0.08577280044555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,8,power_law_1.2,0.08485119938850402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,1,8,power_law_1.2,0.09258880019187928
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,2,1,balanced,0.1861600081125895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,2,1,balanced,0.18765334288279215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,2,1,power_law_1.01,0.1979200005531311
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,2,1,power_law_1.01,0.19996800422668456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,2,1,power_law_1.2,0.19843839406967162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,2,1,power_law_1.2,0.20142719745635987
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,4,1,balanced,0.13105600078900656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,4,1,balanced,0.133242666721344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,4,1,power_law_1.01,0.1330623984336853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,4,1,power_law_1.01,0.13392000198364257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,4,1,power_law_1.2,0.13489919900894165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,4,1,power_law_1.2,0.1352255940437317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,8,1,balanced,0.10594133536020915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,8,1,balanced,0.10690133770306905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,8,1,power_law_1.01,0.10557440519332886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,8,1,power_law_1.01,0.1056447982788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,8,1,power_law_1.2,0.10544639825820923
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,4096,1536,8,128,8,1,power_law_1.2,0.10629119873046874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,1,balanced,0.7918506463368734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,1,balanced,0.7983520030975342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,1,power_law_1.01,0.47171840667724607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,1,power_law_1.01,0.5083839893341064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,1,power_law_1.2,0.4665664196014404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,1,power_law_1.2,0.4800447940826416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,2,balanced,0.37223998705546063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,2,balanced,0.37548800309499103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,2,power_law_1.01,0.2874943971633911
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,2,power_law_1.01,0.3197824001312256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,2,power_law_1.2,0.34955520629882814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,2,power_law_1.2,0.35844480991363525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,4,balanced,0.16023466984430948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,4,balanced,0.1611253321170807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,4,power_law_1.01,0.22913920879364014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,4,power_law_1.01,0.23876481056213378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,4,power_law_1.2,0.22190721035003663
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,4,power_law_1.2,0.2353600025177002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,8,balanced,0.1051573355992635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,8,balanced,0.1065120001633962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,8,power_law_1.01,0.17200000286102296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,8,power_law_1.01,0.17984000444412232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,8,power_law_1.2,0.17086080312728882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,1,8,power_law_1.2,0.17396479845046997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,16,1,balanced,0.09939199686050415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,16,1,balanced,0.10318400462468465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,16,1,power_law_1.01,0.07626879811286927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,16,1,power_law_1.01,0.0778432011604309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,16,1,power_law_1.2,0.07672320008277893
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,16,1,power_law_1.2,0.07783039808273315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,2,1,balanced,0.4093386729558309
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,2,1,balanced,0.40996265411376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,2,1,power_law_1.01,0.2534847974777222
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,2,1,power_law_1.01,0.2671488046646118
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,2,1,power_law_1.2,0.25824000835418703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,2,1,power_law_1.2,0.2689215898513794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,32,1,balanced,0.07092266778151195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,32,1,balanced,0.07630933324495952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,32,1,power_law_1.01,0.0649407982826233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,32,1,power_law_1.01,0.06527360081672669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,32,1,power_law_1.2,0.0632960021495819
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,32,1,power_law_1.2,0.0671231985092163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,4,1,balanced,0.2360586722691854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,4,1,balanced,0.23837866385777792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,4,1,power_law_1.01,0.14907519817352294
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,4,1,power_law_1.01,0.1615615963935852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,4,1,power_law_1.2,0.16306560039520263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,4,1,power_law_1.2,0.177401602268219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,8,1,balanced,0.1453973352909088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,8,1,balanced,0.14543466766675314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,8,1,power_law_1.01,0.10824960470199585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,8,1,power_law_1.01,0.10858240127563476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,8,1,power_law_1.2,0.10440959930419921
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,16384,2,8,8,1,power_law_1.2,0.10774400234222412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,1,balanced,0.9252213637034098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,1,balanced,0.9302826722462972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,1,power_law_1.01,0.9643775939941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,1,power_law_1.01,0.9730112075805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,1,power_law_1.2,1.0236607551574708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,1,power_law_1.2,1.025228786468506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,128,balanced,0.05659733215967814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,128,balanced,0.057162667314211525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,128,power_law_1.01,0.05782399773597717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,128,power_law_1.01,0.05898879766464234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,128,power_law_1.2,0.060070401430130003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,128,power_law_1.2,0.06062080264091492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,16,balanced,0.11768000324567159
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,16,balanced,0.11897599697113037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,16,power_law_1.01,0.11369600296020507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,16,power_law_1.01,0.11448960304260254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,16,power_law_1.2,0.1182144045829773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,16,power_law_1.2,0.12342400550842285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,2,balanced,0.4421173334121704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,2,balanced,0.44299201170603436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,2,power_law_1.01,0.4403007984161377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,2,power_law_1.01,0.4576000213623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,2,power_law_1.2,0.47996158599853517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,2,power_law_1.2,0.4925824165344238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,256,balanced,0.05609600245952606
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,256,balanced,0.056362668673197426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,256,power_law_1.01,0.05559679865837097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,256,power_law_1.01,0.05564799904823303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,256,power_law_1.2,0.054585599899291994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,256,power_law_1.2,0.05748479962348938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,32,balanced,0.08902399738629659
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,32,balanced,0.0909493366877238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,32,power_law_1.01,0.08633599877357483
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,32,power_law_1.01,0.08841599822044373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,32,power_law_1.2,0.08565120100975036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,32,power_law_1.2,0.09007359743118286
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,4,balanced,0.2882186571756999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,4,balanced,0.2911840081214905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,4,power_law_1.01,0.2582463979721069
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,4,power_law_1.01,0.2668159961700439
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,4,power_law_1.2,0.2713536024093628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,4,power_law_1.2,0.27815680503845214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,64,balanced,0.07027199864387512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,64,balanced,0.07084799806276958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,64,power_law_1.01,0.07272959947586059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,64,power_law_1.01,0.07365760207176208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,64,power_law_1.2,0.07548159956932068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,64,power_law_1.2,0.07612800002098083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,8,balanced,0.3206453323364258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,8,balanced,0.32790933052698773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,8,power_law_1.01,0.21301119327545165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,8,power_law_1.01,0.22695679664611818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,8,power_law_1.2,0.2275264024734497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,1,8,power_law_1.2,0.2570751905441284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,16,1,balanced,0.1795253356297811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,16,1,balanced,0.18051199118296304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,16,1,power_law_1.01,0.17980799674987794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,16,1,power_law_1.01,0.18033280372619628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,16,1,power_law_1.2,0.18341120481491088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,16,1,power_law_1.2,0.18380160331726075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,2,1,balanced,0.4974506696065267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,2,1,balanced,0.49803733825683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,2,1,power_law_1.01,0.5066112041473388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,2,1,power_law_1.01,0.5089280128479003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,2,1,power_law_1.2,0.5313600063323974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,2,1,power_law_1.2,0.5382271766662597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,32,1,balanced,0.16218666235605875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,32,1,balanced,0.1623093287150065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,32,1,power_law_1.01,0.1602687954902649
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,32,1,power_law_1.01,0.16046719551086425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,32,1,power_law_1.2,0.16122879981994628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,32,1,power_law_1.2,0.16357760429382323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,4,1,balanced,0.3045919934908549
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,4,1,balanced,0.30740267038345337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,4,1,power_law_1.01,0.3020096063613892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,4,1,power_law_1.01,0.3030463933944702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,4,1,power_law_1.2,0.3158911943435669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,4,1,power_law_1.2,0.31867520809173583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,8,1,balanced,0.2146773338317871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,8,1,balanced,0.2155946691830953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,8,1,power_law_1.01,0.21454720497131347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,8,1,power_law_1.01,0.2147968053817749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,8,1,power_law_1.2,0.217305588722229
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2048,8,256,8,1,power_law_1.2,0.22072319984436034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,1,balanced,0.7979253133138021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,1,balanced,0.8013813495635986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,1,power_law_1.01,0.801632022857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,1,power_law_1.01,0.8029439926147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,1,power_law_1.2,0.8290687561035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,1,power_law_1.2,0.829798412322998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,16,balanced,0.10244799653689067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,16,balanced,0.10397866368293762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,16,power_law_1.01,0.10828160047531128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,16,power_law_1.01,0.11208959817886352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,16,power_law_1.2,0.11107840538024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,16,power_law_1.2,0.11340160369873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,2,balanced,0.3979039986928304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,2,balanced,0.398853341738383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,2,power_law_1.01,0.40480642318725585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,2,power_law_1.01,0.40604801177978517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,2,power_law_1.2,0.4236288070678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,2,power_law_1.2,0.4347008228302002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,32,balanced,0.08311466872692108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,32,balanced,0.08481066425641377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,32,power_law_1.01,0.08391680121421814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,32,power_law_1.01,0.08542079925537109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,32,power_law_1.2,0.08609920144081115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,32,power_law_1.2,0.08821120262145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,4,balanced,0.502784013748169
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,4,balanced,0.5042239824930826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,4,power_law_1.01,0.34898560047149657
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,4,power_law_1.01,0.39738879203796384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,4,power_law_1.2,0.3215872049331665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,4,power_law_1.2,0.3307391881942749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,8,balanced,0.150325338045756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,8,balanced,0.1513653298219045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,8,power_law_1.01,0.15768320560455323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,8,power_law_1.01,0.16647679805755616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,8,power_law_1.2,0.18064639568328858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,1,8,power_law_1.2,0.1873471975326538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,2,1,balanced,0.4498879909515381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,2,1,balanced,0.45076799392700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,2,1,power_law_1.01,0.44336638450622556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,2,1,power_law_1.01,0.4465151786804199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,2,1,power_law_1.2,0.4585984230041504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,2,1,power_law_1.2,0.4605504035949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,4,1,balanced,0.2799786726633708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,4,1,balanced,0.2807626724243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,4,1,power_law_1.01,0.26993279457092284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,4,1,power_law_1.01,0.2717375993728638
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,4,1,power_law_1.2,0.27866239547729493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,4,1,power_law_1.2,0.2868096113204956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,8,1,balanced,0.18905067443847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,8,1,balanced,0.18930667638778687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,8,1,power_law_1.01,0.18231680393218994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,8,1,power_law_1.01,0.18326400518417357
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,8,1,power_law_1.2,0.1847615957260132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,6144,2560,8,160,8,1,power_law_1.2,0.1863808035850525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,1,balanced,1.0815359751383464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,1,balanced,1.0838186740875244
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,1,power_law_1.01,1.131123161315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,1,power_law_1.01,1.132249641418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,1,power_law_1.2,1.1933440208435058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,1,power_law_1.2,1.210585594177246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,128,balanced,0.06214400132497152
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,128,balanced,0.06442666550477345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,128,power_law_1.01,0.06430720090866089
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,128,power_law_1.01,0.06498559713363647
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,128,power_law_1.2,0.06661760210990905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,128,power_law_1.2,0.06945919990539551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,16,balanced,0.1311199963092804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,16,balanced,0.13433600465456644
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,16,power_law_1.01,0.12573440074920655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,16,power_law_1.01,0.12851840257644653
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,16,power_law_1.2,0.13018879890441895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,16,power_law_1.2,0.13909120559692384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,2,balanced,0.5144160191218058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,2,balanced,0.51473601659139
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,2,power_law_1.01,0.5244927883148194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,2,power_law_1.01,0.5410304069519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,2,power_law_1.2,0.5569791793823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,2,power_law_1.2,0.5627583980560302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,256,balanced,0.06022400160630544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,256,balanced,0.06025599936644236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,256,power_law_1.01,0.05913599729537964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,256,power_law_1.01,0.06182399988174438
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,256,power_law_1.2,0.06097919940948486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,256,power_law_1.2,0.061689597368240354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,32,balanced,0.10084799925486247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,32,balanced,0.10253866513570149
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,32,power_law_1.01,0.09420160055160523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,32,power_law_1.01,0.09479039907455444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,32,power_law_1.2,0.09886080026626587
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,32,power_law_1.2,0.1013375997543335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,4,balanced,0.3237173358599345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,4,balanced,0.3312693238258362
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,4,power_law_1.01,0.29448959827423093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,4,power_law_1.01,0.3004863977432251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,4,power_law_1.2,0.3093760013580322
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,4,power_law_1.2,0.31690239906311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,64,balanced,0.0796319991350174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,64,balanced,0.08180266618728638
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,64,power_law_1.01,0.0808896005153656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,64,power_law_1.01,0.08134400248527526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,64,power_law_1.2,0.07782400250434876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,64,power_law_1.2,0.08346880078315735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,8,balanced,0.3675040006637573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,8,balanced,0.37961065769195557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,8,power_law_1.01,0.24416639804840087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,8,power_law_1.01,0.2645632028579712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,8,power_law_1.2,0.25207040309906004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,1,8,power_law_1.2,0.2531775951385498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,16,1,balanced,0.20397865772247314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,16,1,balanced,0.20458666483561197
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,16,1,power_law_1.01,0.20566399097442628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,16,1,power_law_1.01,0.20780160427093505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,16,1,power_law_1.2,0.20830719470977782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,16,1,power_law_1.2,0.2089855909347534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,2,1,balanced,0.580069343249003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,2,1,balanced,0.5803039868672689
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,2,1,power_law_1.01,0.5932096004486084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,2,1,power_law_1.01,0.5937280178070068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,2,1,power_law_1.2,0.6278079986572266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,2,1,power_law_1.2,0.6285120010375976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,32,1,balanced,0.18474133809407553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,32,1,balanced,0.18491733074188232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,32,1,power_law_1.01,0.18329600095748902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,32,1,power_law_1.01,0.18332799673080444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,32,1,power_law_1.2,0.1856511950492859
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,32,1,power_law_1.2,0.18636159896850585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,4,1,balanced,0.3526773452758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,4,1,balanced,0.3551946481068929
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,4,1,power_law_1.01,0.3501440048217773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,4,1,power_law_1.01,0.35319039821624754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,4,1,power_law_1.2,0.36459519863128664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,4,1,power_law_1.2,0.368121600151062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,8,1,balanced,0.24726400772730509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,8,1,balanced,0.24733867247899374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,8,1,power_law_1.01,0.2449984073638916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,8,1,power_law_1.01,0.24804480075836183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,8,1,power_law_1.2,0.2539328098297119
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,256,8,1,power_law_1.2,0.2543423891067505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,1,balanced,1.5680425961812336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,1,balanced,1.6798399289449055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,1,power_law_1.01,1.7520639419555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,1,power_law_1.01,1.779596710205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,1,power_law_1.2,1.8310720443725585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,1,power_law_1.2,1.8430912017822265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,128,balanced,0.07031466563542683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,128,balanced,0.07044266661008199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,128,power_law_1.01,0.0686784029006958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,128,power_law_1.01,0.07003520131111145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,128,power_law_1.2,0.07071999907493591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,128,power_law_1.2,0.07217280268669128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,16,balanced,0.23667200406392416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,16,balanced,0.24228266874949136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,16,power_law_1.01,0.1603775978088379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,16,power_law_1.01,0.16684800386428833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,16,power_law_1.2,0.17342079877853395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,16,power_law_1.2,0.19029120206832886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,2,balanced,0.7310506502787272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,2,balanced,0.7311147054036459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,2,power_law_1.01,0.7484159946441651
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,2,power_law_1.01,0.7514560222625732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,2,power_law_1.2,0.761568021774292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,2,power_law_1.2,0.7765503883361816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,32,balanced,0.11338133613268535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,32,balanced,0.11840533216794331
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,32,power_law_1.01,0.10550400018692016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,32,power_law_1.01,0.11197439432144166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,32,power_law_1.2,0.1071552038192749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,32,power_law_1.2,0.11879680156707764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,4,balanced,0.39700265725453693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,4,balanced,0.3970666726430257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,4,power_law_1.01,0.36959359645843504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,4,power_law_1.01,0.38100481033325195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,4,power_law_1.2,0.38759679794311525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,4,power_law_1.2,0.3878015995025635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,64,balanced,0.0928000013033549
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,64,balanced,0.09360000491142273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,64,power_law_1.01,0.08737919926643371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,64,power_law_1.01,0.08896639943122864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,64,power_law_1.2,0.08634240031242371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,64,power_law_1.2,0.0908735990524292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,8,balanced,0.2517919937769572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,8,balanced,0.25356266895929974
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,8,power_law_1.01,0.22225921154022216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,8,power_law_1.01,0.23067519664764405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,8,power_law_1.2,0.2189120054244995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,1,8,power_law_1.2,0.2323904037475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,16,1,balanced,0.2751413385073344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,16,1,balanced,0.27586666742960614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,16,1,power_law_1.01,0.29656319618225097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,16,1,power_law_1.01,0.29916160106658934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,16,1,power_law_1.2,0.3011967897415161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,16,1,power_law_1.2,0.30201599597930906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,2,1,balanced,0.8275466759999593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,2,1,balanced,0.832698663075765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,2,1,power_law_1.01,0.9094400405883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,2,1,power_law_1.01,0.9103232383728027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,2,1,power_law_1.2,0.945139217376709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,2,1,power_law_1.2,0.9454527854919433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,32,1,balanced,0.2462559938430786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,32,1,balanced,0.24714666604995728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,32,1,power_law_1.01,0.2677695989608765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,32,1,power_law_1.01,0.2682687997817993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,32,1,power_law_1.2,0.26869759559631345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,32,1,power_law_1.2,0.2700479984283447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,4,1,balanced,0.4859679937362671
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,4,1,balanced,0.4878186782201131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,4,1,power_law_1.01,0.5212031841278076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,4,1,power_law_1.01,0.5263040065765381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,4,1,power_law_1.2,0.5372672080993652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,4,1,power_law_1.2,0.544313621520996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,8,1,balanced,0.33618664741516113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,8,1,balanced,0.33671998977661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,8,1,power_law_1.01,0.3625983953475952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,8,1,power_law_1.01,0.3630143880844116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,8,1,power_law_1.2,0.3696000099182129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,768,7168,2048,8,384,8,1,power_law_1.2,0.3706239938735962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,1,balanced,0.055258666475613914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,1,balanced,0.05608533322811127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,1,power_law_1.01,0.0470335990190506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,1,power_law_1.01,0.04801279902458191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,1,power_law_1.2,0.04442879855632782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,1,power_law_1.2,0.04444800019264221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,128,balanced,0.02497600018978119
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,128,balanced,0.027109332382678986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,128,power_law_1.01,0.02377600073814392
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,128,power_law_1.01,0.025497600436210632
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,128,power_law_1.2,0.023289600014686586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,128,power_law_1.2,0.02420479953289032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,16,balanced,0.025397333006064098
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,16,balanced,0.025429333249727886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,16,power_law_1.01,0.024748800694942473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,16,power_law_1.01,0.02481279969215393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,16,power_law_1.2,0.02479359954595566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,16,power_law_1.2,0.025088000297546386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,2,balanced,0.03368533402681351
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,2,balanced,0.03532800078392029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,2,power_law_1.01,0.03516800105571747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,2,power_law_1.01,0.03544319868087768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,2,power_law_1.2,0.032416000962257385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,2,power_law_1.2,0.033164799213409424
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,32,balanced,0.025301332275072735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,32,balanced,0.025514667232831318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,32,power_law_1.01,0.023481599986553192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,32,power_law_1.01,0.023558400571346283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,32,power_law_1.2,0.021964800357818604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,32,power_law_1.2,0.02346239984035492
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,4,balanced,0.02976000060637792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,4,balanced,0.030879999200503033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,4,power_law_1.01,0.02808319926261902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,4,power_law_1.01,0.029145601391792297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,4,power_law_1.2,0.027513599395751952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,4,power_law_1.2,0.027993598580360414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,64,balanced,0.023370665808518726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,64,balanced,0.025279998779296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,64,power_law_1.01,0.022124800086021423
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,64,power_law_1.01,0.023865599930286408
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,64,power_law_1.2,0.022291199862957002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,64,power_law_1.2,0.022566400468349457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,8,balanced,0.026320000489552815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,8,balanced,0.0271573339899381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,8,power_law_1.01,0.026316800713539125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,8,power_law_1.01,0.026348799467086792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,8,power_law_1.2,0.026892799139022826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,1,8,power_law_1.2,0.02771199941635132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,2,1,balanced,0.03541333228349686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,2,1,balanced,0.037632000943024956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,2,1,power_law_1.01,0.03268480002880096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,2,1,power_law_1.01,0.033542400598526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,2,1,power_law_1.2,0.031488001346588135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,2,1,power_law_1.2,0.03237760066986084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,4,1,balanced,0.030554667115211487
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,4,1,balanced,0.03123733401298523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,4,1,power_law_1.01,0.028224000334739686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,4,1,power_law_1.01,0.028364801406860353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,4,1,power_law_1.2,0.02778880000114441
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,2048,768,8,128,4,1,power_law_1.2,0.028019198775291444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,1,balanced,0.10001066327095032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,1,balanced,0.1009386678536733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,1,power_law_1.01,0.09808639883995056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,1,power_law_1.01,0.09816960096359253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,1,power_law_1.2,0.09091839790344239
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,1,power_law_1.2,0.09145600199699402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,128,balanced,0.023183998962243397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,128,balanced,0.025205334027608235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,128,power_law_1.01,0.024115200340747833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,128,power_law_1.01,0.024563199281692503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,128,power_law_1.2,0.02290560007095337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,128,power_law_1.2,0.023347200453281404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,16,balanced,0.027466667195161183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,16,balanced,0.02755733331044515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,16,power_law_1.01,0.04595839977264404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,16,power_law_1.01,0.04599039852619171
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,16,power_law_1.2,0.0455487996339798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,16,power_law_1.2,0.04574080109596253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,2,balanced,0.06447466711203258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,2,balanced,0.06503466765085857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,2,power_law_1.01,0.07351040244102477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,2,power_law_1.01,0.07507839798927307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,2,power_law_1.2,0.0671999990940094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,2,power_law_1.2,0.06963840126991272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,256,balanced,0.027589333554108936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,256,balanced,0.02826133370399475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,256,power_law_1.01,0.02455040067434311
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,256,power_law_1.01,0.02550399899482727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,256,power_law_1.2,0.024255999922752382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,256,power_law_1.2,0.024736000597476958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,32,balanced,0.02741866558790207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,32,balanced,0.027461332579453785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,32,power_law_1.01,0.02770560085773468
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,32,power_law_1.01,0.031385600566864014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,32,power_law_1.2,0.028780800104141236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,32,power_law_1.2,0.028908801078796387
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,4,balanced,0.046682665745417275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,4,balanced,0.04790399968624115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,4,power_law_1.01,0.061766397953033444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,4,power_law_1.01,0.0639360010623932
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,4,power_law_1.2,0.06007680296897888
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,4,power_law_1.2,0.061868798732757566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,64,balanced,0.025199999411900837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,64,balanced,0.025466665625572205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,64,power_law_1.01,0.025248000025749208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,64,power_law_1.01,0.02778880000114441
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,64,power_law_1.2,0.025830399990081788
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,64,power_law_1.2,0.026598399877548216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,8,balanced,0.03214933226505915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,8,balanced,0.03307733436425527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,8,power_law_1.01,0.05264000296592712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,8,power_law_1.01,0.054636800289154054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,8,power_law_1.2,0.046367999911308286
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,1,8,power_law_1.2,0.051596802473068235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,2,1,balanced,0.06736533343791962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,2,1,balanced,0.06759466727574666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,2,1,power_law_1.01,0.0648256003856659
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,2,1,power_law_1.01,0.0649407982826233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,2,1,power_law_1.2,0.06069120168685913
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,2,1,power_law_1.2,0.06304640173912049
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,4,1,balanced,0.04808000226815542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,4,1,balanced,0.04864533245563507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,4,1,power_law_1.01,0.04570240080356598
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,4,1,power_law_1.01,0.047244799137115476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,4,1,power_law_1.2,0.045542401075363156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,4,1,power_law_1.2,0.046035200357437134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,8,1,balanced,0.03380800038576126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,8,1,balanced,0.03537066777547201
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,8,1,power_law_1.01,0.03555200099945068
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,8,1,power_law_1.01,0.037254399061203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,8,1,power_law_1.2,0.034195199608802795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,3072,1536,8,256,8,1,power_law_1.2,0.034483200311660765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,1,balanced,0.1398293375968933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,1,balanced,0.14059733351071677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,1,power_law_1.01,0.1353983998298645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,1,power_law_1.2,0.13282560110092162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,1,power_law_1.2,0.13571840524673462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,2,balanced,0.08399466673533122
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,2,balanced,0.08541867136955261
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,2,power_law_1.01,0.08085119724273682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,2,power_law_1.01,0.08139520287513732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,2,power_law_1.2,0.0834496021270752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,2,power_law_1.2,0.08510079979896545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,4,balanced,0.05801600217819214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,4,balanced,0.05978133281071981
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,4,power_law_1.01,0.05741440057754517
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,4,power_law_1.01,0.05779839754104614
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,4,power_law_1.2,0.0573311984539032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,4,power_law_1.2,0.05817599892616272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,8,balanced,0.04218666752179464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,8,balanced,0.04343999922275543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,8,power_law_1.01,0.04139519929885864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,8,power_law_1.01,0.04156799912452698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,8,power_law_1.2,0.04073599874973297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,1,8,power_law_1.2,0.04248960018157959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,16,1,balanced,0.02941333254178365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,16,1,balanced,0.029509333272775013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,16,1,power_law_1.01,0.026892799139022826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,16,1,power_law_1.01,0.028947201371192933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,16,1,power_law_1.2,0.027616000175476073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,16,1,power_law_1.2,0.027750399708747864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,2,1,balanced,0.08497599760691325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,2,1,balanced,0.08550933003425598
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,2,1,power_law_1.01,0.08084480166435241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,2,1,power_law_1.01,0.0846015989780426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,2,1,power_law_1.2,0.0812991976737976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,2,1,power_law_1.2,0.08279039859771728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,32,1,balanced,0.026186667382717133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,32,1,balanced,0.02812266598145167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,32,1,power_law_1.01,0.025177600979804992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,32,1,power_law_1.01,0.027289599180221558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,32,1,power_law_1.2,0.02597759962081909
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,32,1,power_law_1.2,0.027372801303863527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,4,1,balanced,0.058101331194241844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,4,1,balanced,0.05827199916044871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,4,1,power_law_1.01,0.05490559935569763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,4,1,power_law_1.01,0.05559679865837097
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,4,1,power_law_1.2,0.0536575973033905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,4,1,power_law_1.2,0.05549439787864685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,8,1,balanced,0.036992001036802925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,8,1,balanced,0.03762666632731756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,8,1,power_law_1.01,0.0359360009431839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,8,1,power_law_1.01,0.03818880021572113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,8,1,power_law_1.2,0.03532800078392029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,14336,2,8,8,1,power_law_1.2,0.036108800768852235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,1,balanced,0.12379200259844463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,1,balanced,0.12380799651145935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,1,power_law_1.01,0.09653120040893555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,1,power_law_1.01,0.09745280146598816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,1,power_law_1.2,0.09034879803657532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,1,power_law_1.2,0.09107840061187744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,128,balanced,0.027456000447273254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,128,balanced,0.02917333443959554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,128,power_law_1.01,0.0274944007396698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,128,power_law_1.01,0.02776319980621338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,128,power_law_1.2,0.025536000728607178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,128,power_law_1.2,0.02771199941635132
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,16,balanced,0.027749332288901012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,16,balanced,0.028954667349656422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,16,power_law_1.01,0.031737598776817325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,16,power_law_1.01,0.03221760094165802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,16,power_law_1.2,0.03056640028953552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,16,power_law_1.2,0.030854400992393494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,2,balanced,0.0761599987745285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,2,balanced,0.07759466767311096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,2,power_law_1.01,0.06763520240783691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,2,power_law_1.01,0.06846079826354981
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,2,power_law_1.2,0.0606656014919281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,2,power_law_1.2,0.06313599944114685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,32,balanced,0.026821332673231762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,32,balanced,0.02743999908367793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,32,power_law_1.01,0.02593280076980591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,32,power_law_1.01,0.02629759907722473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,32,power_law_1.2,0.025593599677085875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,32,power_law_1.2,0.025900799036026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,4,balanced,0.05363733569780985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,4,balanced,0.054133335749308266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,4,power_law_1.01,0.05615360140800476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,4,power_law_1.01,0.05742719769477844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,4,power_law_1.2,0.048441600799560544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,4,power_law_1.2,0.05076479911804199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,64,balanced,0.025386666258176167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,64,balanced,0.027493332823117573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,64,power_law_1.01,0.024672000110149382
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,64,power_law_1.01,0.02629759907722473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,64,power_law_1.2,0.024646399915218352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,64,power_law_1.2,0.025900799036026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,8,balanced,0.032655999064445496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,8,balanced,0.03430933256944021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,8,power_law_1.01,0.03992320001125336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,8,power_law_1.01,0.04594559967517853
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,8,power_law_1.2,0.04216960072517395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,1,8,power_law_1.2,0.04661760032176972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,2,1,balanced,0.07952000200748444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,2,1,balanced,0.07986666758855183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,2,1,power_law_1.01,0.06736639738082886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,2,1,power_law_1.01,0.06808320283889771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,2,1,power_law_1.2,0.060102397203445436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,2,1,power_law_1.2,0.06327679753303528
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,4,1,balanced,0.05532800157864889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,4,1,balanced,0.05782933533191681
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,4,1,power_law_1.01,0.04767360091209412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,4,1,power_law_1.01,0.04875519871711731
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,4,1,power_law_1.2,0.044326400756835936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,4,1,power_law_1.2,0.044710400700569156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,8,1,balanced,0.03770666569471359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,8,1,balanced,0.04008000095685323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,8,1,power_law_1.01,0.035283198952674864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,8,1,power_law_1.01,0.0357120007276535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,8,1,power_law_1.2,0.032569599151611325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,4096,1536,8,128,8,1,power_law_1.2,0.033843201398849485
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,1,balanced,0.21969600518544516
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,1,balanced,0.21970667441685995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,1,power_law_1.01,0.2085184097290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,1,power_law_1.01,0.21264638900756835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,1,power_law_1.2,0.21186559200286864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,1,power_law_1.2,0.21398398876190186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,2,balanced,0.12708800037701926
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,2,balanced,0.12928533554077148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,2,power_law_1.01,0.12503679990768432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,2,power_law_1.01,0.12627840042114258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,2,power_law_1.2,0.12119040489196778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,2,power_law_1.2,0.12669440507888793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,4,balanced,0.07750399907430013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,4,balanced,0.07852266728878021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,4,power_law_1.01,0.07612800002098083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,4,power_law_1.01,0.07789440155029297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,4,power_law_1.2,0.07707520127296448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,4,power_law_1.2,0.0789247989654541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,8,balanced,0.05550933380921682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,8,balanced,0.05625600119431814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,8,power_law_1.01,0.05367680191993714
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,8,power_law_1.01,0.05394560098648071
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,8,power_law_1.2,0.05446400046348572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,1,8,power_law_1.2,0.05572479963302612
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,16,1,balanced,0.03244800120592117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,16,1,balanced,0.03364799916744232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,16,1,power_law_1.01,0.031231999397277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,16,1,power_law_1.01,0.03193599879741669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,16,1,power_law_1.2,0.03081600069999695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,16,1,power_law_1.2,0.03121280074119568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,2,1,balanced,0.12366933623949687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,2,1,balanced,0.12544533610343933
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,2,1,power_law_1.01,0.11905280351638795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,2,1,power_law_1.01,0.12146559953689576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,2,1,power_law_1.2,0.11645439863204957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,2,1,power_law_1.2,0.12284159660339355
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,32,1,balanced,0.029525332152843475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,32,1,balanced,0.029616000751654308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,32,1,power_law_1.01,0.027551999688148497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,32,1,power_law_1.01,0.02813439965248108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,32,1,power_law_1.2,0.027033600211143493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,32,1,power_law_1.2,0.027590399980545043
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,4,1,balanced,0.0786293347676595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,4,1,balanced,0.07903466622034709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,4,1,power_law_1.01,0.07474560141563416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,4,1,power_law_1.01,0.07577599883079529
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,4,1,power_law_1.2,0.0733568012714386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,4,1,power_law_1.2,0.07653120160102844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,8,1,balanced,0.05305066704750061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,8,1,balanced,0.05485333502292633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,8,1,power_law_1.01,0.05070080161094666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,8,1,power_law_1.01,0.05112959742546082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,8,1,power_law_1.2,0.05161600112915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,16384,2,8,8,1,power_law_1.2,0.05258880257606506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,1,balanced,0.2153973380724589
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,1,balanced,0.2164693276087443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,1,power_law_1.01,0.21163520812988282
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,1,power_law_1.01,0.21425280570983887
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,1,power_law_1.2,0.19986560344696044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,128,balanced,0.02942399928967158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,128,balanced,0.02942933390537898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,128,power_law_1.01,0.028326401114463808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,128,power_law_1.01,0.031379199028015135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,128,power_law_1.2,0.027878400683403016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,128,power_law_1.2,0.02810879945755005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,16,balanced,0.033728001018365227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,16,balanced,0.03558400024970373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,16,power_law_1.01,0.07468159794807434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,16,power_law_1.01,0.07590399980545044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,16,power_law_1.2,0.07621759772300721
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,16,power_law_1.2,0.07735040187835693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,2,balanced,0.12366933623949687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,2,balanced,0.123690664768219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,2,power_law_1.01,0.14284160137176513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,2,power_law_1.01,0.14869760274887084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,2,power_law_1.2,0.12995840311050416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,2,power_law_1.2,0.1301568031311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,256,balanced,0.029130667448043823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,256,balanced,0.029445332785447437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,256,power_law_1.01,0.02746239900588989
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,256,power_law_1.01,0.029228800535202028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,256,power_law_1.2,0.027372801303863527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,256,power_law_1.2,0.02744320034980774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,32,balanced,0.02924799919128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,32,balanced,0.02957333376010259
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,32,power_law_1.01,0.05172479748725891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,32,power_law_1.01,0.0521664023399353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,32,power_law_1.2,0.05167359709739685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,32,power_law_1.2,0.05317760109901428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,4,balanced,0.07739200194676717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,4,balanced,0.07831466694672902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,4,power_law_1.01,0.10567679405212402
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,4,power_law_1.01,0.10929280519485474
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,4,power_law_1.2,0.10748800039291381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,4,power_law_1.2,0.10870399475097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,64,balanced,0.028501334289709728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,64,balanced,0.02942399928967158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,64,power_law_1.01,0.03164800107479095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,64,power_law_1.01,0.032358399033546446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,64,power_law_1.2,0.030527999997138976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,64,power_law_1.2,0.031795200705528257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,8,balanced,0.05407466491063436
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,8,balanced,0.05412800113360087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,8,power_law_1.01,0.09244160056114196
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,8,power_law_1.01,0.09502720236778259
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,8,power_law_1.2,0.0853056013584137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,1,8,power_law_1.2,0.08956800103187561
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,16,1,balanced,0.041493333876132965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,16,1,balanced,0.0423573354880015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,16,1,power_law_1.01,0.04287999868392944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,16,1,power_law_1.01,0.04318079948425293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,16,1,power_law_1.2,0.040575999021530154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,16,1,power_law_1.2,0.0409280002117157
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,2,1,balanced,0.1243839959303538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,2,1,balanced,0.12490133444468181
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,2,1,power_law_1.01,0.1221119999885559
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,2,1,power_law_1.01,0.12378879785537719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,2,1,power_law_1.2,0.11315200328826905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,2,1,power_law_1.2,0.11614079475402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,32,1,balanced,0.0376800000667572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,32,1,balanced,0.03770666569471359
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,32,1,power_law_1.01,0.036447998881340024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,32,1,power_law_1.01,0.03749119937419891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,32,1,power_law_1.2,0.035776001214981076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,32,1,power_law_1.2,0.03622399866580963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,4,1,balanced,0.08003200093905131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,4,1,balanced,0.08045866588751475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,4,1,power_law_1.01,0.07722880244255066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,4,1,power_law_1.01,0.07768319845199585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,4,1,power_law_1.2,0.0736191987991333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,4,1,power_law_1.2,0.07368959784507752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,8,1,balanced,0.057855998476346336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,8,1,balanced,0.05807466804981232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,8,1,power_law_1.01,0.05511680245399475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,8,1,power_law_1.01,0.05589759945869446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,8,1,power_law_1.2,0.05225600004196167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2048,8,256,8,1,power_law_1.2,0.053011202812194826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,1,balanced,0.26263999938964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,1,balanced,0.26358399788538617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,1,power_law_1.01,0.22105600833892822
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,1,power_law_1.01,0.2232640027999878
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,1,power_law_1.2,0.20067200660705567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,1,power_law_1.2,0.20194559097290038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,16,balanced,0.040149333576361336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,16,balanced,0.04331733286380768
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,16,power_law_1.01,0.06500480175018311
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,16,power_law_1.01,0.06513280272483826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,16,power_law_1.2,0.06519039869308471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,16,power_law_1.2,0.06629120111465454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,2,balanced,0.14762133359909058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,2,balanced,0.14803733428319296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,2,power_law_1.01,0.14154239892959594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,2,power_law_1.01,0.14570239782333375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,2,power_law_1.2,0.12579840421676636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,2,power_law_1.2,0.13207039833068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,32,balanced,0.02956799914439519
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,32,balanced,0.03151999910672506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,32,power_law_1.01,0.0459199994802475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,32,power_law_1.01,0.048640000820159915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,32,power_law_1.2,0.035795199871063235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,32,power_law_1.2,0.043859198689460754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,4,balanced,0.0890773336092631
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,4,balanced,0.08917333682378133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,4,power_law_1.01,0.10619519948959351
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,4,power_law_1.01,0.11006079912185669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,4,power_law_1.2,0.10384000539779663
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,4,power_law_1.2,0.11375999450683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,8,balanced,0.062234664956728615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,8,balanced,0.06233599781990051
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,8,power_law_1.01,0.08711040019989014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,8,power_law_1.01,0.08853759765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,8,power_law_1.2,0.08730880022048951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,1,8,power_law_1.2,0.08903040289878845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,2,1,balanced,0.14792533715566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,2,1,balanced,0.14805333813031515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,2,1,power_law_1.01,0.12677760124206544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,2,1,power_law_1.01,0.12828160524368287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,2,1,power_law_1.2,0.11710079908370971
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,2,1,power_law_1.2,0.11822719573974609
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,4,1,balanced,0.09457066655158997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,4,1,balanced,0.09517332911491394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,4,1,power_law_1.01,0.08118399977684021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,4,1,power_law_1.01,0.08440960049629212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,4,1,power_law_1.2,0.07663360238075256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,4,1,power_law_1.2,0.07767040133476258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,8,1,balanced,0.06602666775385539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,8,1,balanced,0.06617600222428639
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,8,1,power_law_1.01,0.056383997201919556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,8,1,power_law_1.01,0.05707520246505737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,8,1,power_law_1.2,0.05326719880104065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,6144,2560,8,160,8,1,power_law_1.2,0.054073601961135864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,1,balanced,0.24706665674845377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,1,balanced,0.2476053237915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,1,power_law_1.01,0.24506878852844238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,1,power_law_1.01,0.24618880748748778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,1,power_law_1.2,0.2186880111694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,1,power_law_1.2,0.2243583917617798
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,128,balanced,0.03121600051720937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,128,balanced,0.03143466760714849
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,128,power_law_1.01,0.029254400730133058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,128,power_law_1.01,0.030022400617599487
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,128,power_law_1.2,0.029120001196861266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,128,power_law_1.2,0.031071999669075014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,16,balanced,0.035642666121323906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,16,balanced,0.037818667789300285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,16,power_law_1.01,0.08416000008583069
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,16,power_law_1.01,0.08424320220947265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,16,power_law_1.2,0.08418560028076172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,16,power_law_1.2,0.08437119722366333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,2,balanced,0.14037866393725076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,2,balanced,0.14076266686121622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,2,power_law_1.01,0.165830397605896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,2,power_law_1.01,0.1670016050338745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,2,power_law_1.2,0.14999040365219116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,2,power_law_1.2,0.15385600328445434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,256,balanced,0.029445332785447437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,256,balanced,0.029493334392706554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,256,power_law_1.01,0.027987200021743774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,256,power_law_1.01,0.030067199468612672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,256,power_law_1.2,0.029369598627090453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,256,power_law_1.2,0.029843199253082275
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,32,balanced,0.031210665901501972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,32,balanced,0.031248000760873158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,32,power_law_1.01,0.055776000022888184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,32,power_law_1.01,0.05736960172653198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,32,power_law_1.2,0.05560960173606873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,32,power_law_1.2,0.057036799192428586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,4,balanced,0.08604799707730611
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,4,balanced,0.08608532945315044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,4,power_law_1.01,0.11720319986343383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,4,power_law_1.01,0.1288383960723877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,4,power_law_1.2,0.11355520486831665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,4,power_law_1.2,0.11683199405670167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,64,balanced,0.029552000264326733
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,64,balanced,0.029989334444204967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,64,power_law_1.01,0.036313599348068236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,64,power_law_1.01,0.03653120100498199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,64,power_law_1.2,0.03285120129585266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,64,power_law_1.2,0.03459199965000152
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,8,balanced,0.05810666580994924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,8,balanced,0.058559998869895935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,8,power_law_1.01,0.09749119877815246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,8,power_law_1.01,0.10280319452285766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,8,power_law_1.2,0.09084799885749817
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,1,8,power_law_1.2,0.10893440246582031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,16,1,balanced,0.04738133152325948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,16,1,balanced,0.047781333327293396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,16,1,power_law_1.01,0.04631040096282959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,16,1,power_law_1.01,0.0482367992401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,16,1,power_law_1.2,0.04445439875125885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,16,1,power_law_1.2,0.046086400747299194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,2,1,balanced,0.13981866836547852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,2,1,balanced,0.1421119968096415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,2,1,power_law_1.01,0.13842560052871705
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,2,1,power_law_1.01,0.13964799642562867
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,2,1,power_law_1.2,0.12643840312957763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,2,1,power_law_1.2,0.12940160036087037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,32,1,balanced,0.04062400013208389
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,32,1,balanced,0.041562666495641075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,32,1,power_law_1.01,0.04058879911899567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,32,1,power_law_1.01,0.04081920087337494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,32,1,power_law_1.2,0.03829759955406189
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,32,1,power_law_1.2,0.03844479918479919
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,4,1,balanced,0.08819199601809184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,4,1,balanced,0.08874133229255676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,4,1,power_law_1.01,0.08614400029182434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,4,1,power_law_1.01,0.08634240031242371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,4,1,power_law_1.2,0.07739520072937012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,4,1,power_law_1.2,0.08142079710960388
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,8,1,balanced,0.06228800117969513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,8,1,balanced,0.06252799928188324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,8,1,power_law_1.01,0.06054400205612183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,8,1,power_law_1.01,0.06094080209732056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,8,1,power_law_1.2,0.056620800495147706
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,256,8,1,power_law_1.2,0.057894402742385866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,1,balanced,0.2472533384958903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,1,balanced,0.24850666522979736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,1,power_law_1.01,0.24442880153656005
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,1,power_law_1.01,0.2466559886932373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,1,power_law_1.2,0.24542078971862794
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,1,power_law_1.2,0.2457535982131958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,128,balanced,0.029546665648619335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,128,balanced,0.03148799886306127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,128,power_law_1.01,0.031251201033592226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,128,power_law_1.01,0.03133440017700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,128,power_law_1.2,0.03155840039253235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,128,power_law_1.2,0.03158400058746338
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,16,balanced,0.037658666570981346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,16,balanced,0.03796799977620443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,16,power_law_1.01,0.10654720067977905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,16,power_law_1.01,0.10795520544052124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,16,power_law_1.2,0.10215679407119752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,16,power_law_1.2,0.10447360277175903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,2,balanced,0.139765332142512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,2,balanced,0.14071999986966452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,2,power_law_1.01,0.17255040407180786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,2,power_law_1.01,0.17757439613342285
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,2,power_law_1.2,0.16870399713516235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,2,power_law_1.2,0.1810431957244873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,32,balanced,0.03161066770553589
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,32,balanced,0.03178133318821589
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,32,power_law_1.01,0.07000960111618042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,32,power_law_1.01,0.07055360078811646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,32,power_law_1.2,0.0686079978942871
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,32,power_law_1.2,0.07069439888000488
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,4,balanced,0.08477333188056946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,4,balanced,0.08521067102750142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,4,power_law_1.01,0.13316479921340943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,4,power_law_1.01,0.1369920015335083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,4,power_law_1.2,0.14254720211029054
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,4,power_law_1.2,0.1459712028503418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,64,balanced,0.029450667401154835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,64,balanced,0.030789333085219067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,64,power_law_1.01,0.05090559720993042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,64,power_law_1.01,0.05156480073928833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,64,power_law_1.2,0.05077760219573975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,64,power_law_1.2,0.051020801067352295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,8,balanced,0.058431997895240784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,8,balanced,0.059263999263445534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,8,power_law_1.01,0.11315840482711792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,8,power_law_1.01,0.1145792007446289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,8,power_law_1.2,0.11827839612960815
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,1,8,power_law_1.2,0.13320319652557372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,16,1,balanced,0.045567999283472695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,16,1,balanced,0.047824000318845115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,16,1,power_law_1.01,0.048019200563430786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,16,1,power_law_1.01,0.04802559912204742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,16,1,power_law_1.2,0.048153600096702574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,16,1,power_law_1.2,0.048902401328086854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,2,1,balanced,0.14049599568049112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,2,1,balanced,0.14071999986966452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,2,1,power_law_1.01,0.1381824016571045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,2,1,power_law_1.01,0.139027202129364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,2,1,power_law_1.2,0.14009599685668944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,2,1,power_law_1.2,0.14037760496139526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,32,1,balanced,0.03972266614437103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,32,1,balanced,0.04171200096607208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,32,1,power_law_1.01,0.03957119882106781
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,32,1,power_law_1.01,0.04012160003185272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,32,1,power_law_1.2,0.03966079950332642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,32,1,power_law_1.2,0.03969280123710632
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,4,1,balanced,0.08681600292523702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,4,1,balanced,0.08771199981371562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,4,1,power_law_1.01,0.08492159843444824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,4,1,power_law_1.01,0.08643839955329895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,4,1,power_law_1.2,0.08610560297966004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,4,1,power_law_1.2,0.0862335979938507
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,8,1,balanced,0.06298666695753734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,8,1,balanced,0.06301333506902058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,8,1,power_law_1.01,0.06047999858856201
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,8,1,power_law_1.01,0.06107519865036011
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,8,1,power_law_1.2,0.06099200248718262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8,7168,2048,8,384,8,1,power_law_1.2,0.06124160289764404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,1,balanced,0.08397866288820903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,1,balanced,0.0844693382581075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,1,power_law_1.01,0.07898880243301391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,1,power_law_1.01,0.08080000281333924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,1,power_law_1.2,0.07998080253601074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,1,power_law_1.2,0.08028159737586975
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,128,balanced,0.03547733277082443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,128,balanced,0.03707200040419897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,128,power_law_1.01,0.03371520042419433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,128,power_law_1.01,0.03492479920387268
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,128,power_law_1.2,0.03314560055732727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,128,power_law_1.2,0.033964800834655764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,16,balanced,0.03352533280849457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,16,balanced,0.033530667424201965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,16,power_law_1.01,0.031302401423454286
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,16,power_law_1.01,0.031795200705528257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,16,power_law_1.2,0.03184640109539032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,16,power_law_1.2,0.03208959996700287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,2,balanced,0.05973866581916809
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,2,balanced,0.060085331400235496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,2,power_law_1.01,0.05550720095634461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,2,power_law_1.01,0.05729280114173889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,2,power_law_1.2,0.056934398412704465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,2,power_law_1.2,0.057894402742385866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,32,balanced,0.03774400055408478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,32,balanced,0.037903999288876854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,32,power_law_1.01,0.03581439852714539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,32,power_law_1.01,0.03638400137424469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,32,power_law_1.2,0.03498879969120026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,32,power_law_1.2,0.035648000240325925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,4,balanced,0.03775999943415324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,4,balanced,0.04200000067551931
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,4,power_law_1.01,0.037862399220466615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,4,power_law_1.01,0.03896960020065308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,4,power_law_1.2,0.03800320029258728
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,4,power_law_1.2,0.03935360014438629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,64,balanced,0.035599999129772186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,64,balanced,0.03742400060097376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,64,power_law_1.01,0.03437440097332001
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,64,power_law_1.01,0.03566080033779144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,64,power_law_1.2,0.03413119912147522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,64,power_law_1.2,0.034406399726867674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,8,balanced,0.035599999129772186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,8,balanced,0.035743998984495796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,8,power_law_1.01,0.033766400814056394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,8,power_law_1.01,0.0341376006603241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,8,power_law_1.2,0.03454079926013946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,1,8,power_law_1.2,0.03463680148124695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,2,1,balanced,0.05990933378537496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,2,1,balanced,0.06150400141874949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,2,1,power_law_1.01,0.0586624026298523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,2,1,power_law_1.01,0.05983359813690185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,2,1,power_law_1.2,0.05866879820823669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,2,1,power_law_1.2,0.059571200609207155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,4,1,balanced,0.04176533222198486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,4,1,balanced,0.0436160018046697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,4,1,power_law_1.01,0.042233601212501526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,4,1,power_law_1.01,0.043398401141166686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,4,1,power_law_1.2,0.044627198576927186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,2048,768,8,128,4,1,power_law_1.2,0.044947201013565065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,1,balanced,0.3134666681289673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,1,balanced,0.3137600024541219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,1,power_law_1.01,0.24789121150970458
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,1,power_law_1.01,0.24993278980255126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,1,power_law_1.2,0.24948480129241943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,1,power_law_1.2,0.25150721073150634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,128,balanced,0.03977066775163015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,128,balanced,0.04083200047413508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,128,power_law_1.01,0.038815999031066896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,128,power_law_1.01,0.03918080031871796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,128,power_law_1.2,0.038540801405906676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,128,power_law_1.2,0.038873600959777835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,16,balanced,0.05332266787687937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,16,balanced,0.05349333087603251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,16,power_law_1.01,0.0466623991727829
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,16,power_law_1.01,0.04761599898338318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,16,power_law_1.2,0.04938240051269531
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,16,power_law_1.2,0.04938879907131195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,2,balanced,0.1737226645151774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,2,balanced,0.1755519906679789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,2,power_law_1.01,0.1401792049407959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,2,power_law_1.01,0.14472320079803466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,2,power_law_1.2,0.1438655972480774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,2,power_law_1.2,0.14403200149536133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,256,balanced,0.039450667798519135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,256,balanced,0.039690665900707245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,256,power_law_1.01,0.0369024008512497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,256,power_law_1.01,0.037254399061203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,256,power_law_1.2,0.036185601353645326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,256,power_law_1.2,0.037036800384521486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,32,balanced,0.03972266614437103
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,32,balanced,0.03979733337958654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,32,power_law_1.01,0.03695360124111176
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,32,power_law_1.01,0.037862399220466615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,32,power_law_1.2,0.03609600067138672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,32,power_law_1.2,0.03849599957466125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,4,balanced,0.10513066252072652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,4,balanced,0.1055573324362437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,4,power_law_1.01,0.08812159895896912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,4,power_law_1.01,0.09267200231552124
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,4,power_law_1.2,0.0907584011554718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,4,power_law_1.2,0.09290879964828491
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,64,balanced,0.0436160018046697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,64,balanced,0.04378133515516917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,64,power_law_1.01,0.041126400232315063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,64,power_law_1.01,0.04147840142250061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,64,power_law_1.2,0.04116480052471161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,64,power_law_1.2,0.041971200704574586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,8,balanced,0.07038400073846181
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,8,balanced,0.0709440012772878
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,8,power_law_1.01,0.06156799793243408
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,8,power_law_1.01,0.06272000074386597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,8,power_law_1.2,0.06272000074386597
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,1,8,power_law_1.2,0.06309760212898255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,2,1,balanced,0.17769600947697958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,2,1,balanced,0.17838933070500693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,2,1,power_law_1.01,0.1445248007774353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,2,1,power_law_1.01,0.14479999542236327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,2,1,power_law_1.2,0.14455039501190187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,2,1,power_law_1.2,0.14495999813079835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,4,1,balanced,0.11105599999427795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,4,1,balanced,0.1114026705423991
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,4,1,power_law_1.01,0.09242240190505982
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,4,1,power_law_1.01,0.09336320161819459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,4,1,power_law_1.2,0.09300479888916016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,4,1,power_law_1.2,0.09473919868469238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,8,1,balanced,0.08212799827257793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,8,1,balanced,0.08276799817879994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,8,1,power_law_1.01,0.07234560251235962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,8,1,power_law_1.01,0.07373440265655518
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,8,1,power_law_1.2,0.07103360295295716
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,3072,1536,8,256,8,1,power_law_1.2,0.07223680019378662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,1,balanced,0.17938133080800375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,1,balanced,0.18040533860524496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,1,power_law_1.01,0.17861119508743287
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,1,power_law_1.01,0.17938560247421265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,1,power_law_1.2,0.17408640384674073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,1,power_law_1.2,0.17683839797973633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,2,balanced,0.09134399890899658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,2,balanced,0.09499733646710713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,2,power_law_1.01,0.10173439979553223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,2,power_law_1.01,0.10506240129470826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,2,power_law_1.2,0.10539519786834717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,2,power_law_1.2,0.10629119873046874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,4,balanced,0.09859200318654378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,4,balanced,0.09899733463923137
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,4,power_law_1.01,0.07527040243148804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,4,power_law_1.01,0.07841920256614685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,4,power_law_1.2,0.07448319792747497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,4,power_law_1.2,0.07719039916992188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,8,balanced,0.1738719940185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,8,balanced,0.1741066575050354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,8,power_law_1.01,0.10238080024719239
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,8,power_law_1.01,0.10858880281448365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,8,power_law_1.2,0.09306880235671997
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,1,8,power_law_1.2,0.09969279766082764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,16,1,balanced,0.03565333286921183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,16,1,balanced,0.035760000348091125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,16,1,power_law_1.01,0.033452799916267394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,16,1,power_law_1.01,0.0346560001373291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,16,1,power_law_1.2,0.03322240114212036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,16,1,power_law_1.2,0.03406080007553101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,2,1,balanced,0.09940266609191895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,2,1,balanced,0.10045866171518962
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,2,1,power_law_1.01,0.09916800260543823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,2,1,power_law_1.01,0.1003775954246521
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,2,1,power_law_1.2,0.10060160160064698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,2,1,power_law_1.2,0.10130560398101807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,32,1,balanced,0.02945599953333537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,32,1,balanced,0.03156266609827677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,32,1,power_law_1.01,0.02876160144805908
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,32,1,power_law_1.01,0.030041599273681642
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,32,1,power_law_1.2,0.029555198550224305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,32,1,power_law_1.2,0.030214399099349976
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,4,1,balanced,0.0679253339767456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,4,1,balanced,0.06828799843788147
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,4,1,power_law_1.01,0.06440960168838501
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,4,1,power_law_1.01,0.06475520133972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,4,1,power_law_1.2,0.06425600051879883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,4,1,power_law_1.2,0.06446719765663148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,8,1,balanced,0.04991999765237173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,8,1,balanced,0.04995200037956238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,8,1,power_law_1.01,0.04563199877738953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,8,1,power_law_1.01,0.04725759923458099
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,8,1,power_law_1.2,0.04593920111656189
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,14336,2,8,8,1,power_law_1.2,0.046419200301170346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,1,balanced,0.22760534286499023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,1,balanced,0.2281493345896403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,1,power_law_1.01,0.212556791305542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,1,power_law_1.01,0.2147455930709839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,1,power_law_1.2,0.21463680267333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,1,power_law_1.2,0.21822719573974608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,128,balanced,0.046384001771608986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,128,balanced,0.04721599817276001
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,128,power_law_1.01,0.04357120096683502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,128,power_law_1.01,0.043782401084899905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,128,power_law_1.2,0.04121600091457367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,128,power_law_1.2,0.0433023989200592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,16,balanced,0.060234665870666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,16,balanced,0.0665226678053538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,16,power_law_1.01,0.05586559772491455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,16,power_law_1.01,0.05637120008468628
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,16,power_law_1.2,0.05631999969482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,16,power_law_1.2,0.05674239993095398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,2,balanced,0.13105600078900656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,2,balanced,0.13177067041397095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,2,power_law_1.01,0.1241536021232605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,2,power_law_1.01,0.12458239793777466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,2,power_law_1.2,0.1269695997238159
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,2,power_law_1.2,0.12697600126266478
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,32,balanced,0.07870933413505554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,32,balanced,0.08081600069999695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,32,power_law_1.01,0.07017599940299987
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,32,power_law_1.01,0.07428479790687562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,32,power_law_1.2,0.07147520184516906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,32,power_law_1.2,0.07178879976272583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,4,balanced,0.08378133177757263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,4,balanced,0.0846506655216217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,4,power_law_1.01,0.0797760009765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,4,power_law_1.01,0.08012160062789916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,4,power_law_1.2,0.07912960052490234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,4,power_law_1.2,0.07991039752960205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,64,balanced,0.057258665561676025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,64,balanced,0.058464000622431435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,64,power_law_1.01,0.05184000134468079
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,64,power_law_1.01,0.057043200731277464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,64,power_law_1.2,0.05156480073928833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,64,power_law_1.2,0.05469440221786499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,8,balanced,0.06029333174228668
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,8,balanced,0.06266133487224579
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,8,power_law_1.01,0.05731840133666992
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,8,power_law_1.01,0.058841598033905027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,8,power_law_1.2,0.059411197900772095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,1,8,power_law_1.2,0.060172802209854125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,2,1,balanced,0.13224533200263977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,2,1,balanced,0.13381333152453104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,2,1,power_law_1.01,0.1261952042579651
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,2,1,power_law_1.01,0.12931840419769286
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,2,1,power_law_1.2,0.12798719406127929
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,2,1,power_law_1.2,0.13244800567626952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,4,1,balanced,0.08620267113049825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,4,1,balanced,0.0867680013179779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,4,1,power_law_1.01,0.08496639728546143
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,4,1,power_law_1.01,0.08592000007629394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,4,1,power_law_1.2,0.08540160059928895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,4,1,power_law_1.2,0.08681600093841553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,8,1,balanced,0.06682666639486949
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,8,1,balanced,0.06740266581376393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,8,1,power_law_1.01,0.06710399985313416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,8,1,power_law_1.01,0.06740480065345764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,8,1,power_law_1.2,0.06730239987373351
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,4096,1536,8,128,8,1,power_law_1.2,0.06759679913520814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,1,balanced,0.3601919809977214
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,1,balanced,0.3620426654815674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,1,power_law_1.01,0.3233151912689209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,1,power_law_1.01,0.34472320079803465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,1,power_law_1.2,0.319270396232605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,1,power_law_1.2,0.32666239738464353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,2,balanced,0.1381706694761912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,2,balanced,0.1388159990310669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,2,power_law_1.01,0.1616320013999939
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,2,power_law_1.01,0.1657472014427185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,2,power_law_1.2,0.15726720094680785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,2,power_law_1.2,0.1609279990196228
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,4,balanced,0.11859200398127238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,4,balanced,0.11989866693814595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,4,power_law_1.01,0.09258880019187928
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,4,power_law_1.01,0.0967423975467682
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,4,power_law_1.2,0.09847040176391601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,4,power_law_1.2,0.10660480260848999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,8,balanced,0.19939200083414713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,8,balanced,0.2027519941329956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,8,power_law_1.01,0.11793919801712036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,8,power_law_1.01,0.13396480083465576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,8,power_law_1.2,0.12392319440841675
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,1,8,power_law_1.2,0.14215680360794067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,16,1,balanced,0.045109331607818604
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,16,1,balanced,0.04711466530958811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,16,1,power_law_1.01,0.04221439957618713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,16,1,power_law_1.01,0.04350079894065857
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,16,1,power_law_1.2,0.041631999611854556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,16,1,power_law_1.2,0.04276480078697205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,2,1,balanced,0.14915733536084494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,2,1,balanced,0.1498133341471354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,2,1,power_law_1.01,0.14680320024490356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,2,1,power_law_1.01,0.1526080012321472
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,2,1,power_law_1.2,0.14823039770126342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,2,1,power_law_1.2,0.15121279954910277
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,32,1,balanced,0.03391999999682108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,32,1,balanced,0.03603733330965042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,32,1,power_law_1.01,0.03258880078792572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,32,1,power_law_1.01,0.033030399680137636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,32,1,power_law_1.2,0.0318336009979248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,32,1,power_law_1.2,0.03198080062866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,4,1,balanced,0.09296533465385437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,4,1,balanced,0.09429867068926494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,4,1,power_law_1.01,0.08891519904136658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,4,1,power_law_1.01,0.09192960262298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,4,1,power_law_1.2,0.08986240029335021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,4,1,power_law_1.2,0.0927232027053833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,8,1,balanced,0.06320000191529591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,8,1,balanced,0.06440000236034393
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,8,1,power_law_1.01,0.05998079776763916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,8,1,power_law_1.01,0.061408001184463504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,8,1,power_law_1.2,0.060166400671005246
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,16384,2,8,8,1,power_law_1.2,0.06253439784049988
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,1,balanced,0.7811093330383301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,1,balanced,0.7825653553009033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,1,power_law_1.01,0.6138495922088623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,1,power_law_1.01,0.6250944137573242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,1,power_law_1.2,0.6121856212615967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,1,power_law_1.2,0.6123775959014892
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,128,balanced,0.07652799785137177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,128,balanced,0.07877333462238312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,128,power_law_1.01,0.07315840125083924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,128,power_law_1.01,0.07501440048217774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,128,power_law_1.2,0.07352960109710693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,128,power_law_1.2,0.07463679909706115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,16,balanced,0.08746133248011272
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,16,balanced,0.08798933029174805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,16,power_law_1.01,0.07964800000190735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,16,power_law_1.01,0.08084480166435241
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,16,power_law_1.2,0.08086400032043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,16,power_law_1.2,0.08244479894638061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,2,balanced,0.4097013473510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,2,balanced,0.4107840061187744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,2,power_law_1.01,0.32120959758758544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,2,power_law_1.01,0.3307391881942749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,2,power_law_1.2,0.32517759799957274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,2,power_law_1.2,0.3340480089187622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,256,balanced,0.0591786652803421
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,256,balanced,0.05963733295599619
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,256,power_law_1.01,0.05305600166320801
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,256,power_law_1.01,0.05754240155220032
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,256,power_law_1.2,0.05562880039215088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,256,power_law_1.2,0.056006401777267456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,32,balanced,0.088128000497818
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,32,balanced,0.09406399726867676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,32,power_law_1.01,0.08202239871025085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,32,power_law_1.01,0.08325120210647582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,32,power_law_1.2,0.07854080200195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,32,power_law_1.2,0.0834496021270752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,4,balanced,0.22304532925287882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,4,balanced,0.22643200556437174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,4,power_law_1.01,0.18625279664993286
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,4,power_law_1.01,0.20110719203948973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,4,power_law_1.2,0.18716800212860107
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,4,power_law_1.2,0.1922368049621582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,64,balanced,0.12066133817036946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,64,balanced,0.12171733379364014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,64,power_law_1.01,0.10652799606323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,64,power_law_1.01,0.11269760131835938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,64,power_law_1.2,0.10663679838180543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,64,power_law_1.2,0.10805759429931641
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,8,balanced,0.1309440036614736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,8,balanced,0.13193066914876303
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,8,power_law_1.01,0.1130944013595581
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,8,power_law_1.01,0.11575039625167846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,8,power_law_1.2,0.11337599754333497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,1,8,power_law_1.2,0.12154239416122437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,16,1,balanced,0.10989866654078166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,16,1,balanced,0.11030399799346924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,16,1,power_law_1.01,0.09504640102386475
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,16,1,power_law_1.01,0.09549440145492553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,16,1,power_law_1.2,0.09526399970054626
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,16,1,power_law_1.2,0.09546239972114563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,2,1,balanced,0.41105600198109943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,2,1,balanced,0.41198400656382245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,2,1,power_law_1.01,0.3241408109664917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,2,1,power_law_1.01,0.3318527936935425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,2,1,power_law_1.2,0.3215552091598511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,2,1,power_law_1.2,0.3224447965621948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,32,1,balanced,0.09188266595204671
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,32,1,balanced,0.09297600388526917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,32,1,power_law_1.01,0.08169599771499633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,32,1,power_law_1.01,0.08332160115242004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,32,1,power_law_1.2,0.08244479894638061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,32,1,power_law_1.2,0.08323839902877808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,4,1,balanced,0.22661866744359335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,4,1,balanced,0.22764799992243448
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,4,1,power_law_1.01,0.18559999465942384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,4,1,power_law_1.01,0.18649599552154542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,4,1,power_law_1.2,0.1857599973678589
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,4,1,power_law_1.2,0.18711040019989014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,8,1,balanced,0.14305599530537924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,8,1,balanced,0.1442346672217051
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,8,1,power_law_1.01,0.12065279483795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,8,1,power_law_1.01,0.1213312029838562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,8,1,power_law_1.2,0.12183680534362792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2048,8,256,8,1,power_law_1.2,0.122489595413208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,1,balanced,0.6206080118815104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,1,balanced,0.6212799946467081
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,1,power_law_1.01,0.5487936019897461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,1,power_law_1.01,0.5533440113067627
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,1,power_law_1.2,0.5509439945220947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,1,power_law_1.2,0.5612224102020263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,16,balanced,0.07653333246707916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,16,balanced,0.07659199833869934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,16,power_law_1.01,0.0733568012714386
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,16,power_law_1.01,0.07403519749641418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,16,power_law_1.2,0.07427200078964233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,16,power_law_1.2,0.07429760098457336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,2,balanced,0.32948267459869385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,2,balanced,0.3312319914499919
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,2,power_law_1.01,0.29465599060058595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,2,power_law_1.01,0.30176639556884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,2,power_law_1.2,0.3050879955291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,2,power_law_1.2,0.3097536087036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,32,balanced,0.07830933233102162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,32,balanced,0.07932800054550171
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,32,power_law_1.01,0.06978560090065003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,32,power_law_1.01,0.06991360187530518
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,32,power_law_1.2,0.06941440105438232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,32,power_law_1.2,0.06976640224456787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,4,balanced,0.1843679944674174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,4,balanced,0.1848106582959493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,4,power_law_1.01,0.16764800548553466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,4,power_law_1.01,0.17034239768981935
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,4,power_law_1.2,0.1679487943649292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,4,power_law_1.2,0.16866559982299806
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,8,balanced,0.11105066537857056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,8,balanced,0.1127786636352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,8,power_law_1.01,0.10095360279083251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,8,power_law_1.01,0.10343680381774903
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,8,power_law_1.2,0.10362880229949951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,1,8,power_law_1.2,0.10421119928359986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,2,1,balanced,0.33347201347351074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,2,1,balanced,0.33635199069976807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,2,1,power_law_1.01,0.30056960582733155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,2,1,power_law_1.01,0.3020672082901001
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,2,1,power_law_1.2,0.3020224094390869
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,2,1,power_law_1.2,0.30376319885253905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,4,1,balanced,0.1936053236325582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,4,1,balanced,0.19397334257761636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,4,1,power_law_1.01,0.17601280212402343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,4,1,power_law_1.01,0.17984639406204223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,4,1,power_law_1.2,0.17789440155029296
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,4,1,power_law_1.2,0.17958400249481202
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,8,1,balanced,0.11930132905642192
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,8,1,balanced,0.11932800213495891
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,8,1,power_law_1.01,0.11078399419784546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,8,1,power_law_1.01,0.11151360273361206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,8,1,power_law_1.2,0.11153919696807861
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,6144,2560,8,160,8,1,power_law_1.2,0.11345920562744141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,1,balanced,0.9084959824879965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,1,balanced,0.9085226853688558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,1,power_law_1.01,0.7052608013153077
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,1,power_law_1.01,0.7208320140838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,1,power_law_1.2,0.715993595123291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,1,power_law_1.2,0.7162816047668457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,128,balanced,0.0865119993686676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,128,balanced,0.0885759989420573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,128,power_law_1.01,0.08000640273094177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,128,power_law_1.01,0.08551040291786194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,128,power_law_1.2,0.07990400195121765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,128,power_law_1.2,0.08339840173721313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,16,balanced,0.09634133179982503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,16,balanced,0.09779199957847595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,16,power_law_1.01,0.08761600255966187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,16,power_law_1.01,0.09044479727745056
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,16,power_law_1.2,0.08936960101127625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,16,power_law_1.2,0.089683198928833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,2,balanced,0.47306664784749347
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,2,balanced,0.4743573268254598
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,2,power_law_1.01,0.3865920066833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,2,power_law_1.01,0.39070720672607423
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,2,power_law_1.2,0.3688640117645264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,2,power_law_1.2,0.37985920906066895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,256,balanced,0.06284266710281372
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,256,balanced,0.06589333216349284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,256,power_law_1.01,0.056934398412704465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,256,power_law_1.01,0.06479359865188598
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,256,power_law_1.2,0.05539839863777161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,256,power_law_1.2,0.05689600110054016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,32,balanced,0.10072533289591472
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,32,balanced,0.1049173374970754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,32,power_law_1.01,0.08933759927749634
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,32,power_law_1.01,0.09075199961662292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,32,power_law_1.2,0.0886080026626587
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,32,power_law_1.2,0.09141119718551635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,4,balanced,0.25677865743637085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,4,balanced,0.2575040062268575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,4,power_law_1.01,0.22344319820404052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,4,power_law_1.01,0.23375999927520752
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,4,power_law_1.2,0.20791680812835694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,4,power_law_1.2,0.2107327938079834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,64,balanced,0.13457600275675455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,64,balanced,0.1370560030142466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,64,power_law_1.01,0.12301440238952636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,64,power_law_1.01,0.12332160472869873
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,64,power_law_1.2,0.12300800085067749
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,64,power_law_1.2,0.12826240062713623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,8,balanced,0.14850133657455444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,8,balanced,0.14858667055765787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,8,power_law_1.01,0.1279039978981018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,8,power_law_1.01,0.13223040103912354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,8,power_law_1.2,0.13082239627838135
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,1,8,power_law_1.2,0.13432320356369018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,16,1,balanced,0.12295466661453247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,16,1,balanced,0.12441600362459819
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,16,1,power_law_1.01,0.10652799606323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,16,1,power_law_1.01,0.10703359842300415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,16,1,power_law_1.2,0.10536960363388062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,16,1,power_law_1.2,0.10625920295715333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,2,1,balanced,0.47350935141245526
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,2,1,balanced,0.4742506742477417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,2,1,power_law_1.01,0.3769023895263672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,2,1,power_law_1.01,0.3795264005661011
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,2,1,power_law_1.2,0.3699199914932251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,2,1,power_law_1.2,0.37027840614318847
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,32,1,balanced,0.10403733452161153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,32,1,balanced,0.10494933525721233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,32,1,power_law_1.01,0.09047039747238159
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,32,1,power_law_1.01,0.09159039855003356
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,32,1,power_law_1.2,0.09103360176086425
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,32,1,power_law_1.2,0.0937279999256134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,4,1,balanced,0.26071999470392865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,4,1,balanced,0.2615893284479777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,4,1,power_law_1.01,0.2118079900741577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,4,1,power_law_1.01,0.2170559883117676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,4,1,power_law_1.2,0.20689918994903564
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,4,1,power_law_1.2,0.211411190032959
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,8,1,balanced,0.16245333353678384
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,8,1,balanced,0.1642400026321411
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,8,1,power_law_1.01,0.13693439960479736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,8,1,power_law_1.01,0.1378368020057678
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,8,1,power_law_1.2,0.13697279691696168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,256,8,1,power_law_1.2,0.13789440393447877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,1,balanced,1.334346612294515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,1,balanced,1.335429350535075
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,1,power_law_1.01,0.9097855567932129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,1,power_law_1.01,0.9267200469970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,1,power_law_1.2,0.9040703773498535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,1,power_law_1.2,0.9209471702575683
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,128,balanced,0.10563733180363973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,128,balanced,0.110944002866745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,128,power_law_1.01,0.10496640205383301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,128,power_law_1.01,0.10714240074157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,128,power_law_1.2,0.09515519738197327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,128,power_law_1.2,0.10585600137710571
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,16,balanced,0.1223360002040863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,16,balanced,0.12299733360608418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,16,power_law_1.01,0.10619519948959351
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,16,power_law_1.01,0.10696959495544434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,16,power_law_1.2,0.10364799499511719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,16,power_law_1.2,0.11103359460830689
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,2,balanced,0.6860853036244711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,2,balanced,0.6869866847991943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,2,power_law_1.01,0.5281280040740967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,2,power_law_1.01,0.5282432079315186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,2,power_law_1.2,0.5063807964324951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,2,power_law_1.2,0.5071487903594971
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,32,balanced,0.08091199894746144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,32,balanced,0.08211733400821686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,32,power_law_1.01,0.0756608009338379
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,32,power_law_1.01,0.077811199426651
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,32,power_law_1.2,0.07100160121917724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,32,power_law_1.2,0.07317119836807251
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,4,balanced,0.36236266295115155
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,4,balanced,0.36264534791310626
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,4,power_law_1.01,0.32252159118652346
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,4,power_law_1.01,0.3337791919708252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,4,power_law_1.2,0.2684927940368652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,4,power_law_1.2,0.29706239700317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,64,balanced,0.0881813367207845
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,64,balanced,0.09188266595204671
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,64,power_law_1.01,0.07881600260734559
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,64,power_law_1.01,0.08231679797172546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,64,power_law_1.2,0.07908480167388916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,64,power_law_1.2,0.08259199857711792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,8,balanced,0.20267200469970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,8,balanced,0.20314133167266846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,8,power_law_1.01,0.16506240367889405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,8,power_law_1.01,0.1651584029197693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,8,power_law_1.2,0.17099519968032836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,1,8,power_law_1.2,0.1949504017829895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,16,1,balanced,0.1632960041364034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,16,1,balanced,0.16410666704177856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,16,1,power_law_1.01,0.12748160362243652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,16,1,power_law_1.01,0.13036799430847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,16,1,power_law_1.2,0.12713600397109986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,16,1,power_law_1.2,0.12732160091400146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,2,1,balanced,0.6897280216217041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,2,1,balanced,0.6900746822357178
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,2,1,power_law_1.01,0.4857600212097168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,2,1,power_law_1.01,0.4927999973297119
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,2,1,power_law_1.2,0.47132158279418945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,2,1,power_law_1.2,0.4763455867767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,32,1,balanced,0.1344266633192698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,32,1,balanced,0.13595199584960938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,32,1,power_law_1.01,0.10762239694595337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,32,1,power_law_1.01,0.10927360057830811
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,32,1,power_law_1.2,0.10736639499664306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,32,1,power_law_1.2,0.10779520273208618
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,4,1,balanced,0.3684053421020508
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,4,1,balanced,0.3690933386484782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,4,1,power_law_1.01,0.2655488014221191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,4,1,power_law_1.01,0.2688127994537354
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,4,1,power_law_1.2,0.26432640552520753
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,4,1,power_law_1.2,0.26472959518432615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,8,1,balanced,0.22006400426228842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,8,1,balanced,0.2207146684328715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,8,1,power_law_1.01,0.16761599779129027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,8,1,power_law_1.01,0.16764800548553466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,8,1,power_law_1.2,0.16638720035552979
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,80,7168,2048,8,384,8,1,power_law_1.2,0.1672767996788025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,1,balanced,0.43943464756011963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,1,balanced,0.44542932510375977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,1,power_law_1.01,0.47664642333984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,1,power_law_1.01,0.4878592014312744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,1,power_law_1.2,0.48891520500183105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,1,power_law_1.2,0.48930559158325193
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,128,balanced,0.10796266794204712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,128,balanced,0.10946133732795715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,128,power_law_1.01,0.12613120079040527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,128,power_law_1.01,0.12773120403289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,128,power_law_1.2,0.143014395236969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,128,power_law_1.2,0.1451647996902466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,16,balanced,0.12797333796819052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,16,balanced,0.1283146639664968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,16,power_law_1.01,0.15765119791030885
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,16,power_law_1.01,0.16005120277404786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,16,power_law_1.2,0.17049599885940553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,16,power_law_1.2,0.1890239953994751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,2,balanced,0.27401600281397503
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,2,balanced,0.27452266216278076
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,2,power_law_1.01,0.317523193359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,2,power_law_1.01,0.33242239952087405
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,2,power_law_1.2,0.3242624044418335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,2,power_law_1.2,0.34596478939056396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,32,balanced,0.11743467052777608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,32,balanced,0.11958932876586914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,32,power_law_1.01,0.13955199718475342
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,32,power_law_1.01,0.14424959421157837
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,32,power_law_1.2,0.15279359817504884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,32,power_law_1.2,0.15691519975662233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,4,balanced,0.19102933009465536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,4,balanced,0.19123733043670654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,4,power_law_1.01,0.22551040649414061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,4,power_law_1.01,0.22728960514068602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,4,power_law_1.2,0.2400576114654541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,4,power_law_1.2,0.2593408107757568
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,64,balanced,0.1107413371404012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,64,balanced,0.11133333047231038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,64,power_law_1.01,0.13349119424819947
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,64,power_law_1.01,0.1358847975730896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,64,power_law_1.2,0.14882559776306153
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,64,power_law_1.2,0.15244799852371216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,8,balanced,0.1502293348312378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,8,balanced,0.1504639983177185
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,8,power_law_1.01,0.1796031951904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,8,power_law_1.01,0.1890176057815552
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,8,power_law_1.2,0.19971840381622313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,1,8,power_law_1.2,0.2027967929840088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,2,1,balanced,0.3294080098470052
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,2,1,balanced,0.33084267377853394
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,2,1,power_law_1.01,0.3482624053955078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,2,1,power_law_1.01,0.35041279792785646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,2,1,power_law_1.2,0.3510207891464233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,2,1,power_law_1.2,0.3537856101989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,4,1,balanced,0.28566932678222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,4,1,balanced,0.28617600599924725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,4,1,power_law_1.01,0.29701759815216067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,4,1,power_law_1.01,0.29796481132507324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,4,1,power_law_1.2,0.29989759922027587
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,2048,768,8,128,4,1,power_law_1.2,0.3003328084945679
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,1,balanced,0.8272639910380045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,1,balanced,0.8337013721466064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,1,power_law_1.01,0.9984895706176757
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,1,power_law_1.01,1.0058367729187012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,1,power_law_1.2,1.0259072303771972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,1,power_law_1.2,1.0368063926696778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,128,balanced,0.15237333377202353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,128,balanced,0.1534293293952942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,128,power_law_1.01,0.17431039810180665
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,128,power_law_1.01,0.17579519748687744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,128,power_law_1.2,0.19743360280990602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,128,power_law_1.2,0.20102400779724122
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,16,balanced,0.1925813357035319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,16,balanced,0.19362133741378784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,16,power_law_1.01,0.23648641109466553
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,16,power_law_1.01,0.23657600879669188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,16,power_law_1.2,0.2517119884490967
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,16,power_law_1.2,0.27012479305267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,2,balanced,0.473690668741862
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,2,balanced,0.47519465287526447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,2,power_law_1.01,0.5918591976165771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,2,power_law_1.01,0.6066368103027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,2,power_law_1.2,0.6009600162506104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,2,power_law_1.2,0.661843204498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,256,balanced,0.1508693297704061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,256,balanced,0.15171200037002563
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,256,power_law_1.01,0.16868480443954467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,256,power_law_1.01,0.17279360294342042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,256,power_law_1.2,0.18384640216827391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,256,power_law_1.2,0.1942911982536316
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,32,balanced,0.16804265975952148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,32,balanced,0.16880534092585245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,32,power_law_1.01,0.20182399749755858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,32,power_law_1.01,0.20833919048309327
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,32,power_law_1.2,0.221068811416626
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,32,power_law_1.2,0.22832000255584717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,4,balanced,0.31353066364924115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,4,balanced,0.31406400601069134
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,4,power_law_1.01,0.3926016092300415
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,4,power_law_1.01,0.406496000289917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,4,power_law_1.2,0.41918721199035647
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,4,power_law_1.2,0.42609281539916993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,64,balanced,0.15771200259526572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,64,balanced,0.15889066457748413
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,64,power_law_1.01,0.18705919981002808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,64,power_law_1.01,0.18910080194473267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,64,power_law_1.2,0.20661120414733886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,64,power_law_1.2,0.20890240669250487
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,8,balanced,0.23401600122451782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,8,balanced,0.23449599742889404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,8,power_law_1.01,0.28492159843444825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,8,power_law_1.01,0.2972287893295288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,8,power_law_1.2,0.3172800064086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,1,8,power_law_1.2,0.3212480068206787
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,2,1,balanced,0.5329226652781168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,2,1,balanced,0.533951997756958
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,2,1,power_law_1.01,0.6288959980010986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,2,1,power_law_1.01,0.6326911926269532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,2,1,power_law_1.2,0.645088005065918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,2,1,power_law_1.2,0.646457576751709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,4,1,balanced,0.40748266379038495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,4,1,balanced,0.4088746706644694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,4,1,power_law_1.01,0.4651328086853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,4,1,power_law_1.01,0.46561279296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,4,1,power_law_1.2,0.4764224052429199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,4,1,power_law_1.2,0.48033919334411623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,8,1,balanced,0.36090131600697833
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,8,1,balanced,0.36324799060821533
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,8,1,power_law_1.01,0.4052159786224365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,8,1,power_law_1.01,0.40534400939941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,8,1,power_law_1.2,0.41252479553222654
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,3072,1536,8,256,8,1,power_law_1.2,0.41834239959716796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,1,balanced,1.6794026692708333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,1,balanced,1.6817013422648113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,1,power_law_1.01,1.7282304763793945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,1,power_law_1.01,1.7302207946777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,1,power_law_1.2,1.713043212890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,1,power_law_1.2,1.7682624816894532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,2,balanced,0.8969866434733073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,2,balanced,0.909290631612142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,2,power_law_1.01,1.2085375785827637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,2,power_law_1.01,1.2376511573791504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,2,power_law_1.2,1.192518424987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,2,power_law_1.2,1.293727970123291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,4,balanced,0.5316480000813802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,4,balanced,0.5328853527704874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,4,power_law_1.01,0.9232640266418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,4,power_law_1.01,0.9369152069091797
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,4,power_law_1.2,0.9382143974304199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,4,power_law_1.2,1.2373184204101562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,8,balanced,0.35228800773620605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,8,balanced,0.3527466853459676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,8,power_law_1.01,0.8459456443786622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,8,power_law_1.01,0.8761024475097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,8,power_law_1.2,0.8704192161560058
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,1,8,power_law_1.2,0.8811840057373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,16,1,balanced,0.2929226756095886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,16,1,balanced,0.2936319907506307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,16,1,power_law_1.01,0.2944960117340088
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,16,1,power_law_1.01,0.2959104061126709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,16,1,power_law_1.2,0.2930943965911865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,16,1,power_law_1.2,0.29324800968170167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,2,1,balanced,0.902949333190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,2,1,balanced,0.9046719868977865
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,2,1,power_law_1.01,0.9409215927124024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,2,1,power_law_1.01,0.9477439880371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,2,1,power_law_1.2,0.9351424217224121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,2,1,power_law_1.2,0.9497471809387207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,32,1,balanced,0.25036799907684326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,32,1,balanced,0.25071465969085693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,32,1,power_law_1.01,0.252128005027771
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,32,1,power_law_1.01,0.2523008108139038
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,32,1,power_law_1.2,0.2524991989135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,32,1,power_law_1.2,0.2533632040023804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,4,1,balanced,0.5529706478118896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,4,1,balanced,0.5537759860356649
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,4,1,power_law_1.01,0.5611392021179199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,4,1,power_law_1.01,0.5666944026947022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,4,1,power_law_1.2,0.5633408069610596
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,4,1,power_law_1.2,0.567628812789917
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,8,1,balanced,0.3774293263753255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,8,1,balanced,0.3778666655222575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,8,1,power_law_1.01,0.3831360101699829
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,8,1,power_law_1.01,0.3834624052047729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,8,1,power_law_1.2,0.37985279560089114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,14336,2,8,8,1,power_law_1.2,0.388972806930542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,1,balanced,0.9622666835784912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,1,balanced,0.967573324839274
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,1,power_law_1.01,1.0705408096313476
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,1,power_law_1.01,1.0707776069641113
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,1,power_law_1.2,1.0774144172668456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,1,power_law_1.2,1.1000127792358398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,128,balanced,0.18729066848754883
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,128,balanced,0.18825066089630127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,128,power_law_1.01,0.2297663927078247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,128,power_law_1.01,0.23088641166687013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,128,power_law_1.2,0.26489601135253904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,128,power_law_1.2,0.2671488046646118
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,16,balanced,0.23174933592478433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,16,balanced,0.23360532522201538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,16,power_law_1.01,0.29040639400482177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,16,power_law_1.01,0.3
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,16,power_law_1.2,0.322540807723999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,16,power_law_1.2,0.32499840259552004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,2,balanced,0.5486720005671183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,2,balanced,0.5499893426895142
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,2,power_law_1.01,0.6455359935760498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,2,power_law_1.01,0.6676864147186279
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,2,power_law_1.2,0.6831999778747558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,2,power_law_1.2,0.7078080177307129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,32,balanced,0.20509866873423258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,32,balanced,0.20549867550532022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,32,power_law_1.01,0.25571839809417723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,32,power_law_1.01,0.25847039222717283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,32,power_law_1.2,0.2782399892807007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,32,power_law_1.2,0.2899264097213745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,4,balanced,0.36315735181172687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,4,balanced,0.364303986231486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,4,power_law_1.01,0.44225921630859377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,4,power_law_1.01,0.5144000053405762
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,4,power_law_1.2,0.47487359046936034
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,4,power_law_1.2,0.4914815902709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,64,balanced,0.1947093407313029
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,64,balanced,0.19512534141540527
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,64,power_law_1.01,0.23863680362701417
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,64,power_law_1.01,0.2432255983352661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,64,power_law_1.2,0.27409279346466064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,64,power_law_1.2,0.2852992057800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,8,balanced,0.27587199211120605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,8,balanced,0.27688000599543255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,8,power_law_1.01,0.35978240966796876
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,8,power_law_1.01,0.3735872030258179
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,8,power_law_1.2,0.3693824052810669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,1,8,power_law_1.2,0.3721024036407471
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,2,1,balanced,0.636901338895162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,2,1,balanced,0.639520009358724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,2,1,power_law_1.01,0.6924608230590821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,2,1,power_law_1.01,0.6925312042236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,2,1,power_law_1.2,0.6954432010650635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,2,1,power_law_1.2,0.699283218383789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,4,1,balanced,0.49753065903981525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,4,1,balanced,0.49932801723480225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,4,1,power_law_1.01,0.5282688140869141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,4,1,power_law_1.01,0.5341824054718017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,4,1,power_law_1.2,0.5359488010406495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,4,1,power_law_1.2,0.5394879817962647
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,8,1,balanced,0.4490079879760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,8,1,balanced,0.44915199279785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,8,1,power_law_1.01,0.4699967861175537
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,8,1,power_law_1.01,0.4761343955993652
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,8,1,power_law_1.2,0.4738880157470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,4096,1536,8,128,8,1,power_law_1.2,0.47390079498291016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,1,balanced,3.2708266576131186
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,1,balanced,3.2876853942871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,1,power_law_1.01,3.4012481689453127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,1,power_law_1.01,3.4797630310058594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,1,power_law_1.2,3.2903297424316404
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,1,power_law_1.2,3.4336318969726562
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,2,balanced,1.7351360321044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,2,balanced,1.7522560755411785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,2,power_law_1.01,1.903116798400879
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,2,power_law_1.01,2.3169727325439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,2,power_law_1.2,2.3795391082763673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,2,power_law_1.2,2.5603904724121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,4,balanced,0.939130703608195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,4,balanced,0.9453653494517008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,4,power_law_1.01,2.0122432708740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,4,power_law_1.01,2.064569664001465
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,4,power_law_1.2,1.8475519180297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,4,power_law_1.2,1.852454376220703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,8,balanced,0.5528479814529419
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,8,balanced,0.5607359806696574
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,8,power_law_1.01,1.6330432891845703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,8,power_law_1.01,1.634694480895996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,8,power_law_1.2,1.6631040573120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,1,8,power_law_1.2,1.73187198638916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,16,1,balanced,0.416431983311971
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,16,1,balanced,0.4168320099512736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,16,1,power_law_1.01,0.4223423957824707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,16,1,power_law_1.01,0.4242879867553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,16,1,power_law_1.2,0.4223423957824707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,16,1,power_law_1.2,0.42255358695983886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,2,1,balanced,1.4591679573059082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,2,1,balanced,1.463253339131673
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,2,1,power_law_1.01,1.4812543869018555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,2,1,power_law_1.01,1.5095423698425292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,2,1,power_law_1.2,1.5079296112060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,2,1,power_law_1.2,1.5138367652893066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,32,1,balanced,0.34601600964864093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,32,1,balanced,0.34703465302785236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,32,1,power_law_1.01,0.3534976005554199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,32,1,power_law_1.01,0.3541120052337646
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,32,1,power_law_1.2,0.3524928092956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,32,1,power_law_1.2,0.35335679054260255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,4,1,balanced,0.855557362238566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,4,1,balanced,0.8573226928710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,4,1,power_law_1.01,0.8895615577697754
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,4,1,power_law_1.01,0.8906368255615235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,4,1,power_law_1.2,0.8784959793090821
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,4,1,power_law_1.2,0.8964223861694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,8,1,balanced,0.5657333135604858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,8,1,balanced,0.5683573484420776
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,8,1,power_law_1.01,0.5784768104553223
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,8,1,power_law_1.01,0.5802112102508545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,8,1,power_law_1.2,0.5720384120941162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,16384,2,8,8,1,power_law_1.2,0.5763904094696045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,1,balanced,1.8629013697306316
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,1,balanced,1.8738880157470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,1,power_law_1.01,2.2925952911376952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,1,power_law_1.01,2.2940736770629884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,1,power_law_1.2,2.3489599227905273
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,1,power_law_1.2,2.354047966003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,128,balanced,0.26175999641418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,128,balanced,0.2632906635602315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,128,power_law_1.01,0.31111679077148435
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,128,power_law_1.01,0.3143104076385498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,128,power_law_1.2,0.348799991607666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,128,power_law_1.2,0.3644864082336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,16,balanced,0.3389546473821004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,16,balanced,0.34038400650024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,16,power_law_1.01,0.43915519714355467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,16,power_law_1.01,0.45041279792785643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,16,power_law_1.2,0.47599358558654786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,16,power_law_1.2,0.4938047885894775
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,2,balanced,1.0262826283772786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,2,balanced,1.0304053624471028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,2,power_law_1.01,1.2995136260986329
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,2,power_law_1.01,1.3003328323364258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,2,power_law_1.2,1.3471936225891112
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,2,power_law_1.2,1.4403391838073731
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,256,balanced,0.2595626711845398
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,256,balanced,0.2609493335088094
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,256,power_law_1.01,0.29580800533294677
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,256,power_law_1.01,0.29813759326934813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,256,power_law_1.2,0.34152960777282715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,256,power_law_1.2,0.34985599517822263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,32,balanced,0.2999573349952698
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,32,balanced,0.30003199974695843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,32,power_law_1.01,0.3801919937133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,32,power_law_1.01,0.3817728042602539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,32,power_law_1.2,0.4102208137512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,32,power_law_1.2,0.43128318786621095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,4,balanced,0.6208106676737467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,4,balanced,0.6227519909540812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,4,power_law_1.01,0.7939136028289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,4,power_law_1.01,0.8006527900695801
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,4,power_law_1.2,0.8472576141357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,4,power_law_1.2,0.8486656188964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,64,balanced,0.27383466561635333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,64,balanced,0.27562665939331055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,64,power_law_1.01,0.33599998950958254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,64,power_law_1.01,0.35382399559020994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,64,power_law_1.2,0.3673727989196777
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,64,power_law_1.2,0.37556478977203367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,8,balanced,0.43093868096669513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,8,balanced,0.43133334318796795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,8,power_law_1.01,0.5809599876403808
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,8,power_law_1.01,0.5841599941253662
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,8,power_law_1.2,0.593503999710083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,1,8,power_law_1.2,0.595308780670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,16,1,balanced,0.5707039833068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,16,1,balanced,0.5735626618067423
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,16,1,power_law_1.01,0.6200704097747802
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,16,1,power_law_1.01,0.620684814453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,16,1,power_law_1.2,0.6314943790435791
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,16,1,power_law_1.2,0.6383488178253174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,2,1,balanced,1.1254773139953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,2,1,balanced,1.1254879633585613
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,2,1,power_law_1.01,1.350374412536621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,2,1,power_law_1.01,1.3548992156982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,2,1,power_law_1.2,1.3851584434509276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,2,1,power_law_1.2,1.3889599800109864
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,32,1,balanced,0.5830986499786377
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,32,1,balanced,0.5860960086186727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,32,1,power_law_1.01,0.6348095893859863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,32,1,power_law_1.01,0.6349376201629638
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,32,1,power_law_1.2,0.6456704139709473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,32,1,power_law_1.2,0.6576255798339844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,4,1,balanced,0.7859146595001221
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,4,1,balanced,0.7871092955271403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,4,1,power_law_1.01,0.894752025604248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,4,1,power_law_1.01,0.9077568054199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,4,1,power_law_1.2,0.9305536270141601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,4,1,power_law_1.2,0.9325119972229003
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,8,1,balanced,0.6335999965667725
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,8,1,balanced,0.6345173517862955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,8,1,power_law_1.01,0.6996032238006592
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,8,1,power_law_1.01,0.7005055904388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,8,1,power_law_1.2,0.7245567798614502
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2048,8,256,8,1,power_law_1.2,0.7269375801086426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,1,balanced,3.7064479192097983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,1,balanced,3.7150398890177407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,1,power_law_1.01,2.4447872161865236
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,1,power_law_1.01,2.4468799591064454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,1,power_law_1.2,2.4637887954711912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,1,power_law_1.2,2.4895679473876955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,16,balanced,0.37916799386342365
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,16,balanced,0.3797973394393921
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,16,power_law_1.01,0.49974398612976073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,16,power_law_1.01,0.5121088027954102
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,16,power_law_1.2,0.5406527996063233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,16,power_law_1.2,0.5469888210296631
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,2,balanced,1.516874631245931
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,2,balanced,1.524778683980306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,2,power_law_1.01,1.3395071983337403
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,2,power_law_1.01,1.4076095581054688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,2,power_law_1.2,1.4165247917175292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,2,power_law_1.2,1.5752896308898925
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,32,balanced,0.3201120098431905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,32,balanced,0.32067734003067017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,32,power_law_1.01,0.415008020401001
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,32,power_law_1.01,0.41687679290771484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,32,power_law_1.2,0.48349437713623045
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,32,power_law_1.2,0.49524478912353515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,4,balanced,0.7596960067749023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,4,balanced,0.7640960216522217
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,4,power_law_1.01,0.9128767967224121
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,4,power_law_1.01,0.9308095932006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,4,power_law_1.2,0.8871616363525391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,4,power_law_1.2,0.9187456130981445
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,8,balanced,0.5044960180918375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,8,balanced,0.5086506605148315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,8,power_law_1.01,0.5965760231018067
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,8,power_law_1.01,0.6380735874176026
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,8,power_law_1.2,0.7042240142822266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,1,8,power_law_1.2,0.7418367862701416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,2,1,balanced,2.122154712677002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,2,1,balanced,2.126858711242676
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,2,1,power_law_1.01,1.4377535820007323
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,2,1,power_law_1.01,1.4440704345703126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,2,1,power_law_1.2,1.4332223892211915
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,2,1,power_law_1.2,1.4517375946044921
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,4,1,balanced,1.31113600730896
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,4,1,balanced,1.317834695180257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,4,1,power_law_1.01,0.9544960021972656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,4,1,power_law_1.01,0.9594047546386719
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,4,1,power_law_1.2,0.9721280097961426
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,4,1,power_law_1.2,0.9828672409057617
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,8,1,balanced,0.9940693378448486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,8,1,balanced,1.000069300333659
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,8,1,power_law_1.01,0.7720191955566407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,8,1,power_law_1.01,0.7813119888305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,8,1,power_law_1.2,0.7805247783660889
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,6144,2560,8,160,8,1,power_law_1.2,0.782751989364624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,1,balanced,2.1345067024230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,1,balanced,2.1822880109151206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,1,power_law_1.01,2.6847551345825194
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,1,power_law_1.01,2.691129684448242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,1,power_law_1.2,2.7583744049072267
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,1,power_law_1.2,2.781491279602051
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,128,balanced,0.299621323744456
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,128,balanced,0.3015146652857463
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,128,power_law_1.01,0.35187840461730957
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,128,power_law_1.01,0.3596224069595337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,128,power_law_1.2,0.4040703773498535
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,128,power_law_1.2,0.41877760887146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,16,balanced,0.38810133934020996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,16,balanced,0.38977599143981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,16,power_law_1.01,0.5051199913024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,16,power_law_1.01,0.5101119995117187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,16,power_law_1.2,0.5472383975982666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,16,power_law_1.2,0.5849023818969726
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,2,balanced,1.172426700592041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,2,balanced,1.1937386989593506
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,2,power_law_1.01,1.4555007934570312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,2,power_law_1.01,1.5809920310974122
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,2,power_law_1.2,1.5993535995483399
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,2,power_law_1.2,1.6253376007080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,256,balanced,0.2953760027885437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,256,balanced,0.29600000381469727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,256,power_law_1.01,0.3367232084274292
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,256,power_law_1.01,0.33748478889465333
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,256,power_law_1.2,0.374566388130188
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,256,power_law_1.2,0.3937407970428467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,32,balanced,0.3413279851277669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,32,balanced,0.34249599774678546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,32,power_law_1.01,0.4366720199584961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,32,power_law_1.01,0.4372288227081299
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,32,power_law_1.2,0.4654975891113281
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,32,power_law_1.2,0.5041215896606446
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,4,balanced,0.7138453324635824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,4,balanced,0.7182880242665609
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,4,power_law_1.01,0.925055980682373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,4,power_law_1.01,0.9337856292724609
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,4,power_law_1.2,0.9944831848144531
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,4,power_law_1.2,1.0166912078857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,64,balanced,0.3139626582463582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,64,balanced,0.315829336643219
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,64,power_law_1.01,0.3882816076278687
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,64,power_law_1.01,0.3885632038116455
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,64,power_law_1.2,0.4352255821228027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,64,power_law_1.2,0.4384960174560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,8,balanced,0.4941546519597371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,8,balanced,0.4969173272450765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,8,power_law_1.01,0.649561595916748
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,8,power_law_1.01,0.6543871879577636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,8,power_law_1.2,0.7088768005371093
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,1,8,power_law_1.2,0.7192768096923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,16,1,balanced,0.6491039991378784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,16,1,balanced,0.6501866579055786
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,16,1,power_law_1.01,0.7151616096496582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,16,1,power_law_1.01,0.715999984741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,16,1,power_law_1.2,0.7305151939392089
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,16,1,power_law_1.2,0.73405442237854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,2,1,balanced,1.2977973620096843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,2,1,balanced,1.3033653100331624
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,2,1,power_law_1.01,1.565401554107666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,2,1,power_law_1.01,1.5979071617126466
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,2,1,power_law_1.2,1.6121728897094727
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,2,1,power_law_1.2,1.6401664733886718
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,32,1,balanced,0.6653333504994711
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,32,1,balanced,0.6658026774724325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,32,1,power_law_1.01,0.7236095905303955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,32,1,power_law_1.01,0.7267392158508301
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,32,1,power_law_1.2,0.7440512180328369
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,32,1,power_law_1.2,0.7543039798736573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,4,1,balanced,0.9014986356099447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,4,1,balanced,0.9091467062632242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,4,1,power_law_1.01,1.0400639533996583
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,4,1,power_law_1.01,1.0500415802001952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,4,1,power_law_1.2,1.0666111946105956
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,4,1,power_law_1.2,1.082380771636963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,8,1,balanced,0.7228533426920573
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,8,1,balanced,0.7234559853871664
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,8,1,power_law_1.01,0.816864013671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,8,1,power_law_1.01,0.8175423622131348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,8,1,power_law_1.2,0.8224384307861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,256,8,1,power_law_1.2,0.8345855712890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,1,balanced,6.254922866821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,1,balanced,6.31117312113444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,1,power_law_1.01,3.0031999588012694
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,1,power_law_1.01,3.011494445800781
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,1,power_law_1.2,3.1828479766845703
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,1,power_law_1.2,3.200447845458984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,128,balanced,0.30795733133951825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,128,balanced,0.31170133749643963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,128,power_law_1.01,0.3498879909515381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,128,power_law_1.01,0.3525952100753784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,128,power_law_1.2,0.3828160047531128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,128,power_law_1.2,0.390662407875061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,16,balanced,0.43987735112508136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,16,balanced,0.44092798233032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,16,power_law_1.01,0.5212736129760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,16,power_law_1.01,0.5275712013244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,16,power_law_1.2,0.5391488075256348
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,16,power_law_1.2,0.5720384120941162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,2,balanced,2.2217280069986978
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,2,balanced,2.2537919680277505
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,2,power_law_1.01,1.6881536483764648
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,2,power_law_1.01,1.6965055465698242
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,2,power_law_1.2,1.7849536895751954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,2,power_law_1.2,1.8009088516235352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,32,balanced,0.36606931686401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,32,balanced,0.36737600962320965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,32,power_law_1.01,0.4200128078460693
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,32,power_law_1.01,0.4266047954559326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,32,power_law_1.2,0.4612864017486572
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,32,power_law_1.2,0.46474881172180177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,4,balanced,0.8939200242360433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,4,balanced,0.909226655960083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,4,power_law_1.01,1.0034175872802735
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,4,power_law_1.01,1.0086015701293944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,4,power_law_1.2,1.0725567817687989
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,4,power_law_1.2,1.1133952140808105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,64,balanced,0.32548266649246216
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,64,balanced,0.3264586726824443
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,64,power_law_1.01,0.3729856014251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,64,power_law_1.01,0.3894144058227539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,64,power_law_1.2,0.41510400772094724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,64,power_law_1.2,0.42376317977905276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,8,balanced,0.5989386638005575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,8,balanced,0.6022080183029175
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,8,power_law_1.01,0.6726975917816163
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,8,power_law_1.01,0.685811185836792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,8,power_law_1.2,0.729414415359497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,1,8,power_law_1.2,0.7329279899597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,16,1,balanced,0.9273173014322916
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,16,1,balanced,0.9278240203857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,16,1,power_law_1.01,0.747046422958374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,16,1,power_law_1.01,0.7488319873809814
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,16,1,power_law_1.2,0.7642752170562744
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,16,1,power_law_1.2,0.7655360221862793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,2,1,balanced,2.9849065144856772
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,2,1,balanced,2.996437390645345
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,2,1,power_law_1.01,1.7236223220825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,2,1,power_law_1.01,1.7305023193359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,2,1,power_law_1.2,1.8244735717773437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,2,1,power_law_1.2,1.8380096435546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,32,1,balanced,0.9170026779174805
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,32,1,balanced,0.9173440138498942
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,32,1,power_law_1.01,0.7649087905883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,32,1,power_law_1.01,0.7657087802886963
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,32,1,power_law_1.2,0.7847551822662353
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,32,1,power_law_1.2,0.7933375835418701
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,4,1,balanced,1.7691946029663086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,4,1,balanced,1.771557331085205
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,4,1,power_law_1.01,1.1192000389099122
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,4,1,power_law_1.01,1.1262592315673827
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,4,1,power_law_1.2,1.1775424003601074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,4,1,power_law_1.2,1.1868672370910645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,8,1,balanced,1.1970667044321697
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,8,1,balanced,1.2010613282521565
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,8,1,power_law_1.01,0.8588031768798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,8,1,power_law_1.01,0.8618816375732422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,8,1,power_law_1.2,0.8834495544433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,8192,7168,2048,8,384,8,1,power_law_1.2,0.8862591743469238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,1,balanced,0.08368000388145447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,1,balanced,0.0846560001373291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,1,power_law_1.01,0.08035839796066284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,1,power_law_1.01,0.08253440260887146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,1,power_law_1.2,0.0815999984741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,1,power_law_1.2,0.08199040293693542
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,128,balanced,0.03611200054486593
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,128,balanced,0.03750933210055033
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,128,power_law_1.01,0.034169599413871765
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,128,power_law_1.01,0.03511680066585541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,128,power_law_1.2,0.03369599878787995
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,128,power_law_1.2,0.034220799803733826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,16,balanced,0.033333333830038704
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,16,balanced,0.03333866596221924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,16,power_law_1.01,0.03189760148525238
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,16,power_law_1.01,0.03214080035686493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,16,power_law_1.2,0.03224320113658905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,16,power_law_1.2,0.03247359991073608
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,2,balanced,0.05917333563168844
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,2,balanced,0.059392000238100685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,2,power_law_1.01,0.05793280005455017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,2,power_law_1.01,0.05859839916229248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,2,power_law_1.2,0.05777279734611511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,2,power_law_1.2,0.05867519974708557
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,32,balanced,0.03806400050719579
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,32,balanced,0.03915733347336451
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,32,power_law_1.01,0.0361407995223999
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,32,power_law_1.01,0.03646079897880554
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,32,power_law_1.2,0.03592320084571839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,32,power_law_1.2,0.03624959886074066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,4,balanced,0.03871466716130575
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,4,balanced,0.04032533367474874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,4,power_law_1.01,0.039059200882911684
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,4,power_law_1.01,0.039827200770378116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,4,power_law_1.2,0.0394239991903305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,4,power_law_1.2,0.039776000380516055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,64,balanced,0.0356480007370313
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,64,balanced,0.03751466671625773
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,64,power_law_1.01,0.0348800003528595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,64,power_law_1.01,0.035718399286270144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,64,power_law_1.2,0.03445119857788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,64,power_law_1.2,0.03454079926013946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,8,balanced,0.03541333228349686
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,8,balanced,0.03568000098069509
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,8,power_law_1.01,0.03377279937267304
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,8,power_law_1.01,0.03383040130138397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,8,power_law_1.2,0.03454079926013946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,1,8,power_law_1.2,0.03461759984493255
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,2,1,balanced,0.06115200122197469
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,2,1,balanced,0.062309334675470986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,2,1,power_law_1.01,0.06024320125579834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,2,1,power_law_1.01,0.06146559715270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,2,1,power_law_1.2,0.05818880200386047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,2,1,power_law_1.2,0.05939199924468994
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,4,1,balanced,0.0420959989229838
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,4,1,balanced,0.04367466767628988
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,4,1,power_law_1.01,0.04431360065937042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,4,1,power_law_1.01,0.046489599347114566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,4,1,power_law_1.2,0.04493440091609955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,2048,768,8,128,4,1,power_law_1.2,0.04618239998817444
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,1,balanced,0.3149120012919108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,1,balanced,0.3155946731567383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,1,power_law_1.01,0.25219199657440183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,1,power_law_1.01,0.2585088014602661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,1,power_law_1.2,0.25811200141906737
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,1,power_law_1.2,0.2581248044967651
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,128,balanced,0.039664000272750854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,128,balanced,0.04053333401679993
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,128,power_law_1.01,0.038649600744247434
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,128,power_law_1.01,0.03918080031871796
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,128,power_law_1.2,0.038873600959777835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,128,power_law_1.2,0.03887999951839447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,16,balanced,0.054042667150497437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,16,balanced,0.05406400064627329
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,16,power_law_1.01,0.048556798696517946
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,16,power_law_1.01,0.04948480129241943
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,16,power_law_1.2,0.04713599979877472
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,16,power_law_1.2,0.04787839949131012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,2,balanced,0.1744906703631083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,2,balanced,0.17483733097712198
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,2,power_law_1.01,0.14458880424499512
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,2,power_law_1.01,0.1475391983985901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,2,power_law_1.2,0.14154239892959594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,2,power_law_1.2,0.14926719665527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,256,balanced,0.0395413339138031
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,256,balanced,0.039781334499518074
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,256,power_law_1.01,0.03761920034885406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,256,power_law_1.01,0.03837440013885498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,256,power_law_1.2,0.037350401282310486
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,256,power_law_1.2,0.037811198830604555
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,32,balanced,0.039690665900707245
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,32,balanced,0.039813332259655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,32,power_law_1.01,0.03694719970226288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,32,power_law_1.01,0.03869439959526062
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,32,power_law_1.2,0.03777920007705689
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,32,power_law_1.2,0.0383679986000061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,4,balanced,0.10468266407648723
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,4,balanced,0.10539733370145161
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,4,power_law_1.01,0.09052799940109253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,4,power_law_1.01,0.09281280040740966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,4,power_law_1.2,0.08734719753265381
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,4,power_law_1.2,0.0918079972267151
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,64,balanced,0.04373333354791006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,64,balanced,0.04387733340263367
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,64,power_law_1.01,0.040601599216461184
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,64,power_law_1.01,0.0417279988527298
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,64,power_law_1.2,0.04111360013484955
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,64,power_law_1.2,0.04177280068397522
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,8,balanced,0.07035199801127116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,8,balanced,0.07061866422494252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,8,power_law_1.01,0.06238719820976257
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,8,power_law_1.01,0.06740480065345764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,8,power_law_1.2,0.06232320070266724
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,1,8,power_law_1.2,0.06289920210838318
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,2,1,balanced,0.1778986652692159
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,2,1,balanced,0.17968000968297324
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,2,1,power_law_1.01,0.1466752052307129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,2,1,power_law_1.01,0.1489856004714966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,2,1,power_law_1.2,0.14673919677734376
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,2,1,power_law_1.2,0.1472383975982666
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,4,1,balanced,0.1123466690381368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,4,1,balanced,0.11346133550008138
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,4,1,power_law_1.01,0.09582080245018006
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,4,1,power_law_1.01,0.09719039797782898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,4,1,power_law_1.2,0.09654399752616882
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,4,1,power_law_1.2,0.0973695993423462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,8,1,balanced,0.08235733211040497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,8,1,balanced,0.08243733147780101
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,8,1,power_law_1.01,0.07389439940452576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,8,1,power_law_1.01,0.07528319954872131
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,8,1,power_law_1.2,0.07395200133323669
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,3072,1536,8,256,8,1,power_law_1.2,0.07512320280075073
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,1,balanced,0.18040533860524496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,1,balanced,0.180458664894104
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,1,power_law_1.01,0.18320640325546264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,1,power_law_1.01,0.1840127944946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,1,power_law_1.2,0.1818112015724182
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,1,power_law_1.2,0.18437119722366332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,2,balanced,0.09129599730173747
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,2,balanced,0.0953653355439504
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,2,power_law_1.01,0.10829440355300904
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,2,power_law_1.01,0.1090880036354065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,2,power_law_1.2,0.1090880036354065
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,2,power_law_1.2,0.10952320098876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,4,balanced,0.09522133072217305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,4,balanced,0.09545600414276123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,4,power_law_1.01,0.06952319741249084
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,4,power_law_1.01,0.07626879811286927
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,4,power_law_1.2,0.07780479788780212
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,4,power_law_1.2,0.07809280157089234
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,8,balanced,0.16642666856447855
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,8,balanced,0.17091200749079385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,8,power_law_1.01,0.08328319787979126
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,8,power_law_1.01,0.09088000059127807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,8,power_law_1.2,0.0807424008846283
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,1,8,power_law_1.2,0.08828799724578858
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,16,1,balanced,0.035616000493367515
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,16,1,balanced,0.03604800005753835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,16,1,power_law_1.01,0.03513599932193756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,16,1,power_law_1.01,0.03558399975299835
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,16,1,power_law_1.2,0.034176000952720643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,16,1,power_law_1.2,0.034508800506591795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,2,1,balanced,0.1002400020758311
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,2,1,balanced,0.10169066985448201
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,2,1,power_law_1.01,0.10488959550857543
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,2,1,power_law_1.01,0.10539519786834717
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,2,1,power_law_1.2,0.1033471941947937
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,2,1,power_law_1.2,0.10504319667816162
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,32,1,balanced,0.03192000091075897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,32,1,balanced,0.03365333378314972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,32,1,power_law_1.01,0.030457600951194763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,32,1,power_law_1.01,0.032313600182533264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,32,1,power_law_1.2,0.03075839877128601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,32,1,power_law_1.2,0.03204480111598969
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,4,1,balanced,0.06834666430950165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,4,1,balanced,0.06854400038719177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,4,1,power_law_1.01,0.06676480174064636
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,4,1,power_law_1.01,0.06711680293083191
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,4,1,power_law_1.2,0.06529920101165772
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,4,1,power_law_1.2,0.0663424015045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,8,1,balanced,0.04991999765237173
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,8,1,balanced,0.050527999798456825
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,8,1,power_law_1.01,0.04848639965057373
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,8,1,power_law_1.01,0.04875519871711731
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,8,1,power_law_1.2,0.04702720046043396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,14336,2,8,8,1,power_law_1.2,0.04821760058403015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,1,balanced,0.2266133427619934
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,1,balanced,0.22801599899927774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,1,power_law_1.01,0.21765120029449464
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,1,power_law_1.01,0.21914238929748536
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,1,power_law_1.2,0.22580480575561523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,1,power_law_1.2,0.22593278884887696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,128,balanced,0.046309332052866616
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,128,balanced,0.047882666190465294
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,128,power_law_1.01,0.04279040098190308
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,128,power_law_1.01,0.04384639859199524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,128,power_law_1.2,0.0418368011713028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,128,power_law_1.2,0.04249599874019623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,16,balanced,0.060047999024391174
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,16,balanced,0.0612960010766983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,16,power_law_1.01,0.054713600873947145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,16,power_law_1.01,0.0578495979309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,16,power_law_1.2,0.053311997652053834
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,16,power_law_1.2,0.05456640124320984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,2,balanced,0.13061867157618204
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,2,balanced,0.132533331712087
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,2,power_law_1.01,0.12687360048294066
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,2,power_law_1.01,0.13068799972534179
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,2,power_law_1.2,0.12640639543533325
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,2,power_law_1.2,0.12827520370483397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,32,balanced,0.07858666777610779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,32,balanced,0.08154666423797607
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,32,power_law_1.01,0.06931840181350708
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,32,power_law_1.01,0.07459840178489685
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,32,power_law_1.2,0.0705024003982544
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,32,power_law_1.2,0.07052159905433655
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,4,balanced,0.0844106674194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,4,balanced,0.08478933572769165
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,4,power_law_1.01,0.07997440099716187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,4,power_law_1.01,0.08132479786872863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,4,power_law_1.2,0.08019840121269226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,4,power_law_1.2,0.08080000281333924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,64,balanced,0.05796800057093302
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,64,balanced,0.058149332801500954
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,64,power_law_1.01,0.05260800123214722
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,64,power_law_1.01,0.055206400156021115
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,64,power_law_1.2,0.05133439898490906
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,64,power_law_1.2,0.05249279737472534
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,8,balanced,0.06215466558933258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,8,balanced,0.06262933214505513
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,8,power_law_1.01,0.05912960171699524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,8,power_law_1.01,0.059411197900772095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,8,power_law_1.2,0.05854719877243042
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,1,8,power_law_1.2,0.05937280058860779
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,2,1,balanced,0.13357333342234293
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,2,1,balanced,0.13514133294423422
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,2,1,power_law_1.01,0.1287616014480591
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,2,1,power_law_1.01,0.12986880540847778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,2,1,power_law_1.2,0.13370239734649658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,2,1,power_law_1.2,0.13455359935760497
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,4,1,balanced,0.08674133817354839
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,4,1,balanced,0.08695466319719951
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,4,1,power_law_1.01,0.08561919927597046
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,4,1,power_law_1.01,0.08650879859924317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,4,1,power_law_1.2,0.08788480162620545
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,4,1,power_law_1.2,0.08901119828224183
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,8,1,balanced,0.0680159976085027
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,8,1,balanced,0.06814399858315785
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,8,1,power_law_1.01,0.06858879923820496
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,8,1,power_law_1.01,0.06933119893074036
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,8,1,power_law_1.2,0.06883199810981751
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,4096,1536,8,128,8,1,power_law_1.2,0.06944000124931335
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,1,balanced,0.36030399799346924
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,1,balanced,0.3621866703033447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,1,power_law_1.01,0.3515199899673462
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,1,power_law_1.01,0.3629120111465454
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,1,power_law_1.2,0.3592063903808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,1,power_law_1.2,0.362227201461792
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,2,balanced,0.13801599542299905
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,2,balanced,0.13945600390434265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,2,power_law_1.01,0.1581120014190674
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,2,power_law_1.01,0.18136320114135743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,2,power_law_1.2,0.16474239826202391
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,2,power_law_1.2,0.17320319414138793
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,4,balanced,0.11619200309117635
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,4,balanced,0.11681600411732991
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,4,power_law_1.01,0.09584640264511109
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,4,power_law_1.01,0.10181759595870972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,4,power_law_1.2,0.09657599925994872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,4,power_law_1.2,0.09799039959907532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,8,balanced,0.18529067436854044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,8,balanced,0.1914773384730021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,8,power_law_1.01,0.09464960098266602
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,8,power_law_1.01,0.10509439706802368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,8,power_law_1.2,0.09821439981460571
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,1,8,power_law_1.2,0.10488320589065551
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,16,1,balanced,0.04604800045490265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,16,1,balanced,0.04757866760094961
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,16,1,power_law_1.01,0.043321600556373595
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,16,1,power_law_1.01,0.04426240026950836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,16,1,power_law_1.2,0.04385280013084412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,16,1,power_law_1.2,0.04517120122909546
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,2,1,balanced,0.1486240029335022
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,2,1,balanced,0.1502026617527008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,2,1,power_law_1.01,0.15720959901809692
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,2,1,power_law_1.01,0.15873279571533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,2,1,power_law_1.2,0.15820800065994262
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,2,1,power_law_1.2,0.15996160507202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,32,1,balanced,0.035349334279696144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,32,1,balanced,0.03572800010442734
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,32,1,power_law_1.01,0.03372800052165985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,32,1,power_law_1.01,0.03447040021419525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,32,1,power_law_1.2,0.03326080143451691
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,32,1,power_law_1.2,0.03353599905967712
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,4,1,balanced,0.09233066439628601
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,4,1,balanced,0.09265599648157756
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,4,1,power_law_1.01,0.09418240189552307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,4,1,power_law_1.01,0.0942143976688385
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,4,1,power_law_1.2,0.09462400078773499
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,4,1,power_law_1.2,0.09552000164985656
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,8,1,balanced,0.06407466530799866
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,8,1,balanced,0.06445866823196411
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,8,1,power_law_1.01,0.06136959791183472
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,8,1,power_law_1.01,0.0638592004776001
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,8,1,power_law_1.2,0.0615231990814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,16384,2,8,8,1,power_law_1.2,0.063155198097229
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,1,balanced,0.7815360228220621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,1,balanced,0.7834933598836263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,1,power_law_1.01,0.6213183879852295
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,1,power_law_1.01,0.6262144088745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,1,power_law_1.2,0.6244991779327392
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,1,power_law_1.2,0.6291327953338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,128,balanced,0.0766186664501826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,128,balanced,0.07868800063927968
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,128,power_law_1.01,0.0731328010559082
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,128,power_law_1.01,0.07425919771194459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,128,power_law_1.2,0.07198079824447631
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,128,power_law_1.2,0.07319039702415467
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,16,balanced,0.08788800239562988
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,16,balanced,0.08880533774693807
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,16,power_law_1.01,0.07415680289268493
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,16,power_law_1.01,0.07946879863739013
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,16,power_law_1.2,0.08006399869918823
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,16,power_law_1.2,0.08267520070075988
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,2,balanced,0.4100373188654582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,2,balanced,0.4105493227640788
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,2,power_law_1.01,0.3460864067077637
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,2,power_law_1.01,0.35900800228118895
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,2,power_law_1.2,0.3414144039154053
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,2,power_law_1.2,0.3472896099090576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,256,balanced,0.05850133299827576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,256,balanced,0.05855466425418854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,256,power_law_1.01,0.05408639907836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,256,power_law_1.01,0.057068800926208495
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,256,power_law_1.2,0.053958398103713986
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,256,power_law_1.2,0.05418879985809326
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,32,balanced,0.08980266253153484
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,32,balanced,0.09114666779836018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,32,power_law_1.01,0.08057600259780884
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,32,power_law_1.01,0.08399360179901123
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,32,power_law_1.2,0.07949439883232116
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,32,power_law_1.2,0.08451840281486511
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,4,balanced,0.22376533349355063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,4,balanced,0.22535467147827148
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,4,power_law_1.01,0.1892416000366211
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,4,power_law_1.01,0.19143680334091187
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,4,power_law_1.2,0.18852479457855226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,4,power_law_1.2,0.20045440196990966
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,64,balanced,0.12173333764076233
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,64,balanced,0.12270933389663696
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,64,power_law_1.01,0.10907520055770874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,64,power_law_1.01,0.11054079532623291
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,64,power_law_1.2,0.10373120307922364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,64,power_law_1.2,0.10588159561157226
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,8,balanced,0.1327893336613973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,8,balanced,0.13306666413942972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,8,power_law_1.01,0.11110399961471558
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,8,power_law_1.01,0.11875840425491332
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,8,power_law_1.2,0.11353600025177002
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,1,8,power_law_1.2,0.12223999500274658
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,16,1,balanced,0.11120532949765523
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,16,1,balanced,0.11132267117500305
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,16,1,power_law_1.01,0.10019840002059936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,16,1,power_law_1.01,0.1011199951171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,16,1,power_law_1.2,0.10029439926147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,16,1,power_law_1.2,0.10165120363235473
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,2,1,balanced,0.41274134318033856
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,2,1,balanced,0.41411733627319336
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,2,1,power_law_1.01,0.32778239250183105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,2,1,power_law_1.01,0.33758718967437745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,2,1,power_law_1.2,0.3302848100662231
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,2,1,power_law_1.2,0.33758718967437745
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,32,1,balanced,0.09106666843096416
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,32,1,balanced,0.09405866265296936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,32,1,power_law_1.01,0.08504319787025452
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,32,1,power_law_1.01,0.08581119775772095
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,32,1,power_law_1.2,0.08532480001449586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,32,1,power_law_1.2,0.08556159734725952
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,4,1,balanced,0.22815465927124023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,4,1,balanced,0.22849599520365396
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,4,1,power_law_1.01,0.1869696021080017
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,4,1,power_law_1.01,0.18929280042648317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,4,1,power_law_1.2,0.18782080411911012
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,4,1,power_law_1.2,0.189792001247406
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,8,1,balanced,0.14382400115331015
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,8,1,balanced,0.14442666371663412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,8,1,power_law_1.01,0.1264896035194397
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,8,1,power_law_1.01,0.1300927996635437
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,8,1,power_law_1.2,0.12539520263671874
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2048,8,256,8,1,power_law_1.2,0.12617599964141846
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,1,balanced,0.6210293372472128
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,1,balanced,0.6232800086339315
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,1,power_law_1.01,0.5573823928833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,1,power_law_1.01,0.5770304203033447
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,1,power_law_1.2,0.5763072013854981
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,1,power_law_1.2,0.5777472019195556
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,16,balanced,0.11412800351778667
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,16,balanced,0.11486933628718059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,16,power_law_1.01,0.09831039905548096
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,16,power_law_1.01,0.10009599924087524
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,16,power_law_1.2,0.09799039959907532
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,16,power_law_1.2,0.10506880283355713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,2,balanced,0.330949326356252
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,2,balanced,0.3317333261171977
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,2,power_law_1.01,0.30814080238342284
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,2,power_law_1.01,0.3122944116592407
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,2,power_law_1.2,0.30737919807434083
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,2,power_law_1.2,0.30957438945770266
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,32,balanced,0.2022506594657898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,32,balanced,0.20418665806452432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,32,power_law_1.01,0.14797439575195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,32,power_law_1.01,0.1742784023284912
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,32,power_law_1.2,0.13672319650650025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,32,power_law_1.2,0.1661120057106018
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,4,balanced,0.1851466695467631
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,4,balanced,0.18574933211008707
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,4,power_law_1.01,0.1636031985282898
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,4,power_law_1.01,0.16840319633483886
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,4,power_law_1.2,0.17056000232696533
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,4,power_law_1.2,0.17439359426498413
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,8,balanced,0.11486933628718059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,8,balanced,0.11544000109036763
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,8,power_law_1.01,0.10617599487304688
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,8,power_law_1.01,0.10914560556411743
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,8,power_law_1.2,0.10483839511871337
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,1,8,power_law_1.2,0.10853760242462158
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,2,1,balanced,0.3343786795934041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,2,1,balanced,0.3360480070114136
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,2,1,power_law_1.01,0.30161280632019044
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,2,1,power_law_1.01,0.31042559146881105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,2,1,power_law_1.2,0.3136255979537964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,2,1,power_law_1.2,0.31404800415039064
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,4,1,balanced,0.19347200791041055
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,4,1,balanced,0.19357333580652872
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,4,1,power_law_1.01,0.18094079494476317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,4,1,power_law_1.01,0.18486399650573732
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,4,1,power_law_1.2,0.18528640270233154
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,4,1,power_law_1.2,0.1869312047958374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,8,1,balanced,0.11914133032162984
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,8,1,balanced,0.11993066469828288
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,8,1,power_law_1.01,0.11533440351486206
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,8,1,power_law_1.01,0.11653120517730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,8,1,power_law_1.2,0.11745920181274414
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,6144,2560,8,160,8,1,power_law_1.2,0.1183616042137146
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,1,balanced,0.9096159934997559
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,1,balanced,0.9104800224304199
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,1,power_law_1.01,0.7380928039550781
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,1,power_law_1.01,0.7408127784729004
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,1,power_law_1.2,0.7060031890869141
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,1,power_law_1.2,0.7355072021484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,128,balanced,0.08665066957473755
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,128,balanced,0.08962133526802063
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,128,power_law_1.01,0.07944959998130799
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,128,power_law_1.01,0.08398720026016235
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,128,power_law_1.2,0.07984640002250672
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,128,power_law_1.2,0.08171520233154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,16,balanced,0.09597333272298177
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,16,balanced,0.09710400303204854
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,16,power_law_1.01,0.08536319732666016
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,16,power_law_1.01,0.0920639991760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,16,power_law_1.2,0.08214399814605713
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,16,power_law_1.2,0.0870464026927948
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,2,balanced,0.4737813472747803
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,2,balanced,0.47403732935587567
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,2,power_law_1.01,0.37770240306854247
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,2,power_law_1.01,0.38046720027923586
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,2,power_law_1.2,0.3973632097244263
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,2,power_law_1.2,0.39819519519805907
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,256,balanced,0.06401066482067108
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,256,balanced,0.06418133278687795
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,256,power_law_1.01,0.05635200142860412
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,256,power_law_1.01,0.06325759887695312
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,256,power_law_1.2,0.05546879768371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,256,power_law_1.2,0.05692800283432007
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,32,balanced,0.09968533118565877
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,32,balanced,0.10595200459162395
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,32,power_law_1.01,0.08717439770698547
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,32,power_law_1.01,0.09503359794616699
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,32,power_law_1.2,0.0855296015739441
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,32,power_law_1.2,0.0883903980255127
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,4,balanced,0.25685866673787433
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,4,balanced,0.258245329062144
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,4,power_law_1.01,0.2129983901977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,4,power_law_1.01,0.21865599155426024
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,4,power_law_1.2,0.21224958896636964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,4,power_law_1.2,0.23189759254455566
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,64,balanced,0.1370186706384023
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,64,balanced,0.1379039982954661
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,64,power_law_1.01,0.12554240226745605
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,64,power_law_1.01,0.1271232008934021
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,64,power_law_1.2,0.11458560228347778
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,64,power_law_1.2,0.1233407974243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,8,balanced,0.14924800395965576
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,8,balanced,0.14961600303649902
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,8,power_law_1.01,0.12488960027694702
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,8,power_law_1.01,0.12825599908828736
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,8,power_law_1.2,0.12855679988861085
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,1,8,power_law_1.2,0.13477760553359985
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,16,1,balanced,0.12433600425720215
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,16,1,balanced,0.12459199627240498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,16,1,power_law_1.01,0.11335680484771729
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,16,1,power_law_1.01,0.1133952021598816
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,16,1,power_law_1.2,0.11240960359573364
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,16,1,power_law_1.2,0.1124735951423645
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,2,1,balanced,0.475600004196167
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,2,1,balanced,0.47680532932281494
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,2,1,power_law_1.01,0.37946879863739014
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,2,1,power_law_1.01,0.39288959503173826
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,2,1,power_law_1.2,0.3770751953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,2,1,power_law_1.2,0.3830591917037964
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,32,1,balanced,0.10351999600728352
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,32,1,balanced,0.10419199864069621
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,32,1,power_law_1.01,0.09433599710464477
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,32,1,power_law_1.01,0.09557120203971863
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,32,1,power_law_1.2,0.09512320160865784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,32,1,power_law_1.2,0.09580159783363343
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,4,1,balanced,0.2609813412030538
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,4,1,balanced,0.2627093394597371
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,4,1,power_law_1.01,0.2161087989807129
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,4,1,power_law_1.01,0.21936640739440919
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,4,1,power_law_1.2,0.21592319011688232
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,4,1,power_law_1.2,0.2196671962738037
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,8,1,balanced,0.16470932960510254
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,8,1,balanced,0.16501866777737936
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,8,1,power_law_1.01,0.14191999435424804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,8,1,power_law_1.01,0.14583679437637329
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,8,1,power_law_1.2,0.14306559562683105
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,256,8,1,power_law_1.2,0.145907199382782
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,1,balanced,1.3346559206644695
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,1,balanced,1.336890697479248
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,1,power_law_1.01,0.9614656448364258
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,1,power_law_1.01,0.9682815551757813
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,1,power_law_1.2,0.9404224395751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,1,power_law_1.2,0.942636775970459
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,128,balanced,0.10487467050552368
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,128,balanced,0.11091199517250061
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,128,power_law_1.01,0.09969279766082764
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,128,power_law_1.01,0.1041599988937378
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,128,power_law_1.2,0.10103039741516114
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,128,power_law_1.2,0.10370559692382812
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,16,balanced,0.12335466345151265
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,16,balanced,0.12350400288899739
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,16,power_law_1.01,0.09889280200004577
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,16,power_law_1.01,0.10874240398406983
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,16,power_law_1.2,0.10674560070037842
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,16,power_law_1.2,0.11324160099029541
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,2,balanced,0.6860480308532715
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,2,balanced,0.6891893545786539
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,2,power_law_1.01,0.48967680931091306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,2,power_law_1.01,0.5182591915130615
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,2,power_law_1.2,0.5202367782592774
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,2,power_law_1.2,0.53504638671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,32,balanced,0.0830080012480418
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,32,balanced,0.0832479993502299
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,32,power_law_1.01,0.07301759719848633
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,32,power_law_1.01,0.0741375982761383
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,32,power_law_1.2,0.07549440264701843
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,32,power_law_1.2,0.07630720138549804
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,4,balanced,0.36285332838694256
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,4,balanced,0.36345601081848145
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,4,power_law_1.01,0.303276801109314
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,4,power_law_1.01,0.3365760087966919
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,4,power_law_1.2,0.29998719692230225
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,4,power_law_1.2,0.309497594833374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,64,balanced,0.08861866593360901
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,64,balanced,0.08942400415738423
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,64,power_law_1.01,0.08202880024909973
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,64,power_law_1.01,0.08300799727439881
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,64,power_law_1.2,0.07738879919052125
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,64,power_law_1.2,0.08142719864845276
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,8,balanced,0.20226667324701944
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,8,balanced,0.20389332373936972
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,8,power_law_1.01,0.1713919997215271
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,8,power_law_1.01,0.17247359752655028
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,8,power_law_1.2,0.1613759994506836
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,1,8,power_law_1.2,0.19409919977188111
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,16,1,balanced,0.16454399625460306
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,16,1,balanced,0.16456000010172525
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,16,1,power_law_1.01,0.13160320520401
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,16,1,power_law_1.01,0.13411200046539307
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,16,1,power_law_1.2,0.13329919576644897
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,16,1,power_law_1.2,0.13330559730529784
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,2,1,balanced,0.6896106402079264
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,2,1,balanced,0.6905013720194498
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,2,1,power_law_1.01,0.4980160236358643
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,2,1,power_law_1.01,0.5079423904418945
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,2,1,power_law_1.2,0.483948802947998
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,2,1,power_law_1.2,0.4857024192810059
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,32,1,balanced,0.13544000188509622
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,32,1,balanced,0.1368160049120585
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,32,1,power_law_1.01,0.11084799766540528
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,32,1,power_law_1.01,0.11358720064163208
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,32,1,power_law_1.2,0.11093120574951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,32,1,power_law_1.2,0.11325440406799317
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,4,1,balanced,0.36825064818064374
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,4,1,balanced,0.36830933888753253
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,4,1,power_law_1.01,0.2788671970367432
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,4,1,power_law_1.01,0.2797823905944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,4,1,power_law_1.2,0.2719487905502319
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,4,1,power_law_1.2,0.273305606842041
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,8,1,balanced,0.2217173377672831
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,8,1,balanced,0.22177066405614218
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,8,1,power_law_1.01,0.17267199754714965
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,8,1,power_law_1.01,0.17415679693222047
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,8,1,power_law_1.2,0.16832640171051025
VLLM,0.19.0,NVIDIA B200,moe,vllm_flashinfer_trtllm_moe_fp4,nvfp4,96,7168,2048,8,384,8,1,power_law_1.2,0.1740031957626343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,1,balanced,0.027477333943049114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,1,balanced,0.027530667682488758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,1,power_law_1.01,0.025676798820495606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,1,power_law_1.01,0.025766399502754212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,1,power_law_1.2,0.026662400364875792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,1,power_law_1.2,0.026771199703216553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,128,balanced,0.02740799884001414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,128,balanced,0.02754133443037669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,128,power_law_1.01,0.026675200462341307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,128,power_law_1.01,0.02691200077533722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,128,power_law_1.2,0.02592639923095703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,128,power_law_1.2,0.027475199103355406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,16,balanced,0.027141332626342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,16,balanced,0.027306665976842243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,16,power_law_1.01,0.031839999556541446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,16,power_law_1.01,0.03207040131092072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,16,power_law_1.2,0.032307198643684386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,16,power_law_1.2,0.032927998900413515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,2,balanced,0.03566933423280716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,2,balanced,0.036271999279658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,2,power_law_1.01,0.03201920092105866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,2,power_law_1.01,0.036620798707008365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,2,power_law_1.2,0.03192319869995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,2,power_law_1.2,0.03451519906520843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,32,balanced,0.027082666754722595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,32,balanced,0.029114666084448498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,32,power_law_1.01,0.026636800169944762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,32,power_law_1.01,0.027622398734092713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,32,power_law_1.2,0.027136000990867614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,32,power_law_1.2,0.02728320062160492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,4,balanced,0.02935466667016347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,4,balanced,0.0331839993596077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,4,power_law_1.01,0.03209599852561951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,4,power_law_1.01,0.0323199987411499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,4,power_law_1.2,0.0322816014289856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,4,power_law_1.2,0.03248000144958496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,64,balanced,0.02920000006755193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,64,balanced,0.02938666691382726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,64,power_law_1.01,0.02620159983634949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,64,power_law_1.01,0.026771199703216553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,64,power_law_1.2,0.02720000147819519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,64,power_law_1.2,0.027219200134277345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,8,balanced,0.027488000690937042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,8,balanced,0.02792533238728841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,8,power_law_1.01,0.031481599807739256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,8,power_law_1.01,0.03198719918727875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,8,power_law_1.2,0.03155199885368347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,1,8,power_law_1.2,0.032179200649261476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,2,1,balanced,0.021509334444999695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,2,1,balanced,0.022986667851607006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,2,1,power_law_1.01,0.02088959962129593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,2,1,power_law_1.01,0.024108800292015075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,2,1,power_law_1.2,0.020902399718761445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,2,1,power_law_1.2,0.0211776003241539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,4,1,balanced,0.023077333966890972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,4,1,balanced,0.023221333821614582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,4,1,power_law_1.01,0.020479999482631683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,4,1,power_law_1.01,0.020883199572563172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,4,1,power_law_1.2,0.020479999482631683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2048,768,8,128,4,1,power_law_1.2,0.020768000185489653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,1,balanced,0.047872001926104225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,1,balanced,0.048170665899912514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,1,power_law_1.01,0.04671359956264496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,1,power_law_1.01,0.046828800439834596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,1,power_law_1.2,0.0455808013677597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,1,power_law_1.2,0.04644480049610138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,128,balanced,0.03160533308982849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,128,balanced,0.03329066683848699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,128,power_law_1.01,0.030707201361656188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,128,power_law_1.01,0.031052801012992858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,128,power_law_1.2,0.031615999341011045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,128,power_law_1.2,0.03203839957714081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,16,balanced,0.03339199970165888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,16,balanced,0.0335359995563825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,16,power_law_1.01,0.052985602617263795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,16,power_law_1.01,0.05348479747772217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,16,power_law_1.2,0.05214080214500427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,16,power_law_1.2,0.0523967981338501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,2,balanced,0.03756800045569738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,2,balanced,0.039477333426475525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,2,power_law_1.01,0.052179199457168576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,2,power_law_1.01,0.05258240103721619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,2,power_law_1.2,0.05240319967269898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,2,power_law_1.2,0.05338240265846252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,32,balanced,0.03347733368476232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,32,balanced,0.03356266766786575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,32,power_law_1.01,0.044844800233840944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,32,power_law_1.01,0.045388799905776975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,32,power_law_1.2,0.04604159891605377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,32,power_law_1.2,0.04616959989070892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,4,balanced,0.03721600025892258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,4,balanced,0.037471999724706016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,4,power_law_1.01,0.052147197723388675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,4,power_law_1.01,0.05281919836997986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,4,power_law_1.2,0.05221760272979736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,4,power_law_1.2,0.053299200534820554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,64,balanced,0.033088001112143196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,64,balanced,0.033514666060606636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,64,power_law_1.01,0.035046398639678955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,64,power_law_1.01,0.03506560027599335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,64,power_law_1.2,0.0353408008813858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,64,power_law_1.2,0.035846400260925296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,8,balanced,0.03145066648721695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,8,balanced,0.033200000723203026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,8,power_law_1.01,0.05170559883117676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,8,power_law_1.01,0.05261440277099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,8,power_law_1.2,0.052095997333526614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,1,8,power_law_1.2,0.052198398113250735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,16,1,balanced,0.02737066646416982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,16,1,balanced,0.02749866743882497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,16,1,power_law_1.01,0.026598399877548216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,16,1,power_law_1.01,0.026630398631095887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,16,1,power_law_1.2,0.026649600267410277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,16,1,power_law_1.2,0.026956799626350402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,2,1,balanced,0.03129599988460541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,2,1,balanced,0.03235200047492981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,2,1,power_law_1.01,0.030502399802207945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,2,1,power_law_1.01,0.03091199994087219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,2,1,power_law_1.2,0.030393600463867188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,2,1,power_law_1.2,0.03084160089492798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,32,1,balanced,0.029359998802344005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,32,1,balanced,0.029370665550231934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,32,1,power_law_1.01,0.02632960081100464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,32,1,power_law_1.01,0.026572799682617186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,32,1,power_law_1.2,0.026419198513031004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,32,1,power_law_1.2,0.026739200949668883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,4,1,balanced,0.02510400116443634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,4,1,balanced,0.02513599892457326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,4,1,power_law_1.01,0.023526400327682495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,4,1,power_law_1.01,0.023558400571346283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,4,1,power_law_1.2,0.02311040014028549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,4,1,power_law_1.2,0.023340800404548646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,8,1,balanced,0.031498665610949196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,8,1,balanced,0.0315786674618721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,8,1,power_law_1.01,0.02961280047893524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,8,1,power_law_1.01,0.029657599329948426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,8,1,power_law_1.2,0.029094401001930236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,2688,1856,6,128,8,1,power_law_1.2,0.02945919930934906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,1,balanced,0.05761066575845083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,1,balanced,0.060165335734685264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,1,power_law_1.01,0.053881597518920896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,1,power_law_1.01,0.05619199872016907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,1,power_law_1.2,0.05651199817657471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,1,power_law_1.2,0.05989120006561279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,128,balanced,0.03312533348798752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,128,balanced,0.03334933271010717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,128,power_law_1.01,0.03198719918727875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,128,power_law_1.01,0.03219200074672699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,128,power_law_1.2,0.03162879943847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,128,power_law_1.2,0.03199360072612763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,16,balanced,0.03145600110292435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,16,balanced,0.033226666351159416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,16,power_law_1.01,0.058457601070404056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,16,power_law_1.01,0.05971840023994446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,16,power_law_1.2,0.05923839807510376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,16,power_law_1.2,0.059334397315979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,2,balanced,0.04750399788220724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,2,balanced,0.04786666731039683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,2,power_law_1.01,0.05990399718284607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,2,power_law_1.01,0.06222720146179199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,2,power_law_1.2,0.05989760160446167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,2,power_law_1.2,0.060172802209854125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,256,balanced,0.033258666594823204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,256,balanced,0.03365866591533025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,256,power_law_1.01,0.03079040050506592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,256,power_law_1.01,0.031200000643730165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,256,power_law_1.2,0.03132160007953644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,256,power_law_1.2,0.031916800141334536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,32,balanced,0.03225066761175791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,32,balanced,0.03345600018898646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,32,power_law_1.01,0.0603007972240448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,32,power_law_1.01,0.06035199761390686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,32,power_law_1.2,0.05911039710044861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,32,power_law_1.2,0.05973759889602661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,4,balanced,0.03724266588687897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,4,balanced,0.0374293327331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,4,power_law_1.01,0.05899519920349121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,4,power_law_1.01,0.05914239883422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,4,power_law_1.2,0.0593280017375946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,4,power_law_1.2,0.05975040197372437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,64,balanced,0.03223466624816259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,64,balanced,0.033370666205883026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,64,power_law_1.01,0.04519039988517761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,64,power_law_1.01,0.0466623991727829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,64,power_law_1.2,0.04580479860305786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,64,power_law_1.2,0.046911999583244324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,8,balanced,0.033413333197434746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,8,balanced,0.033717334270477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,8,power_law_1.01,0.05934079885482788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,8,power_law_1.01,0.06023039817810059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,8,power_law_1.2,0.05849599838256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,1,8,power_law_1.2,0.0591871976852417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,16,1,balanced,0.023178666830062866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,16,1,balanced,0.023232000569502514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,16,1,power_law_1.01,0.022252799570560457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,16,1,power_law_1.01,0.022355200350284578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,16,1,power_law_1.2,0.022438399493694305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,16,1,power_law_1.2,0.02248319983482361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,2,1,balanced,0.03531199942032496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,2,1,balanced,0.03734933336575826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,2,1,power_law_1.01,0.03689599931240082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,2,1,power_law_1.01,0.03729279935359955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,2,1,power_law_1.2,0.03678080141544342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,2,1,power_law_1.2,0.03763839900493622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,32,1,balanced,0.02333866556485494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,32,1,balanced,0.023552000522613525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,32,1,power_law_1.01,0.02210559993982315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,32,1,power_law_1.01,0.023052799701690673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,32,1,power_law_1.2,0.021516799926757812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,32,1,power_law_1.2,0.02194560021162033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,4,1,balanced,0.026159999271233875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,4,1,balanced,0.026869334280490875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,4,1,power_law_1.01,0.02451840043067932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,4,1,power_law_1.01,0.02504960000514984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,4,1,power_law_1.2,0.024556800723075867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,4,1,power_law_1.2,0.02476159930229187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,8,1,balanced,0.02510400116443634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,8,1,balanced,0.02553066611289978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,8,1,power_law_1.01,0.023628799617290495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,8,1,power_law_1.01,0.024153600633144378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,8,1,power_law_1.2,0.0237184002995491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,3072,1536,8,256,8,1,power_law_1.2,0.023839999735355378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,1,balanced,0.13990933696428934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,1,balanced,0.1399786671002706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,1,power_law_1.01,0.13957120180130006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,1,power_law_1.01,0.14031360149383545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,1,power_law_1.2,0.14073599576950074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,1,power_law_1.2,0.14134399890899657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,2,balanced,0.11038933197657268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,2,balanced,0.11130133271217346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,2,power_law_1.01,0.12333439588546753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,2,power_law_1.01,0.1347648024559021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,2,power_law_1.2,0.12432639598846436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,2,power_law_1.2,0.14368640184402465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,4,balanced,0.1251253286997477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,4,balanced,0.12669333815574646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,4,power_law_1.01,0.11143039464950562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,4,power_law_1.01,0.12362879514694214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,4,power_law_1.2,0.10835839509963989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,4,power_law_1.2,0.1094655990600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,8,balanced,0.11524800459543864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,8,balanced,0.11948266625404358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,8,power_law_1.01,0.1072767972946167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,8,power_law_1.01,0.10844160318374634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,8,power_law_1.2,0.10716160535812377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,1,8,power_law_1.2,0.11041920185089112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,16,1,balanced,0.02735466758410136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,16,1,balanced,0.027637332677841187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,16,1,power_law_1.01,0.029260799288749695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,16,1,power_law_1.01,0.02933120131492615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,16,1,power_law_1.2,0.02661119997501373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,16,1,power_law_1.2,0.029504001140594482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,2,1,balanced,0.08418666323026021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,2,1,balanced,0.08957333366076152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,2,1,power_law_1.01,0.08473600149154663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,2,1,power_law_1.01,0.08725119829177856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,2,1,power_law_1.2,0.08346880078315735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,2,1,power_law_1.2,0.09236479997634887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,32,1,balanced,0.025040000677108765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,32,1,balanced,0.027301333844661713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,32,1,power_law_1.01,0.024153600633144378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,32,1,power_law_1.01,0.02449920028448105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,32,1,power_law_1.2,0.024326400458812715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,32,1,power_law_1.2,0.024556800723075867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,4,1,balanced,0.04897599915663401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,4,1,balanced,0.06750399867693584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,4,1,power_law_1.01,0.04901759922504425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,4,1,power_law_1.01,0.049158400297164916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,4,1,power_law_1.2,0.04907520115375519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,4,1,power_law_1.2,0.0535103976726532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,8,1,balanced,0.03761066744724909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,8,1,balanced,0.03955733279387156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,8,1,power_law_1.01,0.03406080007553101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,8,1,power_law_1.01,0.03426559865474701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,8,1,power_law_1.2,0.034585601091384886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,14336,2,8,8,1,power_law_1.2,0.036735999584198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,1,balanced,0.07284266750017802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,1,balanced,0.07421866556008656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,1,power_law_1.01,0.07061120271682739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,1,power_law_1.01,0.07064319849014282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,1,power_law_1.2,0.06809599995613098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,1,power_law_1.2,0.06991360187530518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,128,balanced,0.035317334036032356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,128,balanced,0.03565866748491923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,128,power_law_1.01,0.03312000036239624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,128,power_law_1.01,0.03375360071659088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,128,power_law_1.2,0.03402880132198334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,128,power_law_1.2,0.03404799997806549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,16,balanced,0.03533333291610082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,16,balanced,0.03557866563399633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,16,power_law_1.01,0.07495679855346679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,16,power_law_1.01,0.07622399926185608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,16,power_law_1.2,0.06835839748382569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,16,power_law_1.2,0.07586560249328614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,2,balanced,0.05569066603978475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,2,balanced,0.056559999783833824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,2,power_law_1.01,0.07548800110816956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,2,power_law_1.01,0.07592319846153259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,2,power_law_1.2,0.07331200242042542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,2,power_law_1.2,0.0775168001651764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,32,balanced,0.03533866753180822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,32,balanced,0.03542399903138479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,32,power_law_1.01,0.05308160185813904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,32,power_law_1.01,0.05400959849357605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,32,power_law_1.2,0.05231999754905701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,32,power_law_1.2,0.052985602617263795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,4,balanced,0.03847466657559077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,4,balanced,0.03937600056330363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,4,power_law_1.01,0.07618560194969178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,4,power_law_1.01,0.07704960107803345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,4,power_law_1.2,0.07406719923019409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,4,power_law_1.2,0.07587839961051941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,64,balanced,0.03562666724125544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,64,balanced,0.03569599986076355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,64,power_law_1.01,0.03678080141544342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,64,power_law_1.01,0.037324801087379456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,64,power_law_1.2,0.03669120073318481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,64,power_law_1.2,0.037324801087379456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,8,balanced,0.03558400024970373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,8,balanced,0.03562133262554804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,8,power_law_1.01,0.0752128005027771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,8,power_law_1.01,0.07598080039024353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,8,power_law_1.2,0.07323520183563233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,1,8,power_law_1.2,0.07640960216522216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,16,1,balanced,0.029322666426499683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,16,1,balanced,0.030613332986831665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,16,1,power_law_1.01,0.028191998600959778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,16,1,power_law_1.01,0.028224000334739686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,16,1,power_law_1.2,0.027596798539161683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,16,1,power_law_1.2,0.028230398893356323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,2,1,balanced,0.04781866570313772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,2,1,balanced,0.04788800080617269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,2,1,power_law_1.01,0.045561599731445315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,2,1,power_law_1.01,0.04557439982891083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,2,1,power_law_1.2,0.04513919949531555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,2,1,power_law_1.2,0.04567680060863495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,32,1,balanced,0.02887466549873352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,32,1,balanced,0.029306667546431225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,32,1,power_law_1.01,0.027871999144554137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,32,1,power_law_1.01,0.02791680097579956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,32,1,power_law_1.2,0.027481600642204285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,32,1,power_law_1.2,0.027987200021743774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,4,1,balanced,0.03369600077470144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,4,1,balanced,0.03543466577927271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,4,1,power_law_1.01,0.030188798904418945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,4,1,power_law_1.01,0.030316799879074097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,4,1,power_law_1.2,0.03128319978713989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,4,1,power_law_1.2,0.033081600069999696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,8,1,balanced,0.031311998764673867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,8,1,balanced,0.03235200047492981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,8,1,power_law_1.01,0.030054399371147157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,8,1,power_law_1.01,0.030297601222991945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,8,1,power_law_1.2,0.030342400074005127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,1536,8,128,8,1,power_law_1.2,0.030393600463867188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,1,balanced,0.24650132656097412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,1,balanced,0.2485439976056417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,1,power_law_1.01,0.24689919948577882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,1,power_law_1.01,0.2487936019897461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,1,power_law_1.2,0.24792320728302003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,1,power_law_1.2,0.2480704069137573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,128,balanced,0.041637333730856575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,128,balanced,0.04179200033346812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,128,power_law_1.01,0.07199360132217407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,128,power_law_1.01,0.07297279834747314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,128,power_law_1.2,0.07173759937286377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,128,power_law_1.2,0.0720255970954895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,16,balanced,0.05593599875768026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,16,balanced,0.06015466650327047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,16,power_law_1.01,0.25271680355072024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,16,power_law_1.01,0.25319681167602537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,16,power_law_1.2,0.25496320724487304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,16,power_law_1.2,0.257587194442749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,2,balanced,0.14920000235239664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,2,balanced,0.14960533380508423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,2,power_law_1.01,0.25564799308776853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,2,power_law_1.01,0.256825590133667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,2,power_law_1.2,0.2565056085586548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,2,power_law_1.2,0.26060800552368163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,256,balanced,0.04147200038035711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,256,balanced,0.041797334949175514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,256,power_law_1.01,0.05494400262832642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,256,power_law_1.01,0.055103999376296994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,256,power_law_1.2,0.055980801582336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,256,power_law_1.2,0.05605120062828064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,32,balanced,0.03962666789690653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,32,balanced,0.04165333261092504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,32,power_law_1.01,0.19774719476699829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,32,power_law_1.01,0.19805439710617065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,32,power_law_1.2,0.19615999460220337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,32,power_law_1.2,0.1977728009223938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,4,balanced,0.09874666730562846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,4,balanced,0.09980266292889912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,4,power_law_1.01,0.2527551889419556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,4,power_law_1.01,0.2543423891067505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,4,power_law_1.2,0.25345919132232664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,4,power_law_1.2,0.25396480560302737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,64,balanced,0.041589332123597465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,64,balanced,0.041802664597829185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,64,power_law_1.01,0.1173632025718689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,64,power_law_1.01,0.11800320148468017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,64,power_law_1.2,0.11786240339279175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,64,power_law_1.2,0.12044800519943237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,8,balanced,0.06402666866779327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,8,balanced,0.0664160003264745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,8,power_law_1.01,0.25207679271697997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,8,power_law_1.01,0.2533695936203003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,8,power_law_1.2,0.2543936014175415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,1,8,power_law_1.2,0.256499195098877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,16,1,balanced,0.08202133576075236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,16,1,balanced,0.08243200182914734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,16,1,power_law_1.01,0.07313920259475708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,16,1,power_law_1.01,0.07326080203056336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,16,1,power_law_1.2,0.07246720194816589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,16,1,power_law_1.2,0.07294080257415772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,2,1,balanced,0.1395146648089091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,2,1,balanced,0.1427893340587616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,2,1,power_law_1.01,0.1336192011833191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,2,1,power_law_1.01,0.13426560163497925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,2,1,power_law_1.2,0.13208320140838622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,2,1,power_law_1.2,0.1368384003639221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,32,1,balanced,0.061994666854540505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,32,1,balanced,0.06215466558933258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,32,1,power_law_1.01,0.05912320017814636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,32,1,power_law_1.01,0.059910398721694944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,32,1,power_law_1.2,0.05958399772644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,32,1,power_law_1.2,0.05978879928588867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,4,1,balanced,0.09976533055305481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,4,1,balanced,0.1019040048122406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,4,1,power_law_1.01,0.08773120045661927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,4,1,power_law_1.01,0.0877568006515503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,4,1,power_law_1.2,0.08531839847564697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,4,1,power_law_1.2,0.08700159788131714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,8,1,balanced,0.05815466741720835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,8,1,balanced,0.06417066852251689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,8,1,power_law_1.01,0.055155199766159055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,8,1,power_law_1.01,0.06104320287704468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,8,1,power_law_1.2,0.05586559772491455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,4096,2688,22,512,8,1,power_law_1.2,0.05687040090560913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,1,balanced,0.21772799889246622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,1,balanced,0.2465226650238037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,1,power_law_1.01,0.2585024118423462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,1,power_law_1.01,0.26347520351409914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,1,power_law_1.2,0.21845760345458984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,1,power_law_1.2,0.23965439796447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,2,balanced,0.15030399958292642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,2,balanced,0.17537067333857217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,2,power_law_1.01,0.1645311951637268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,2,power_law_1.01,0.16637439727783204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,2,power_law_1.2,0.18523520231246948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,2,power_law_1.2,0.21099519729614258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,4,balanced,0.1532639960447947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,4,balanced,0.15340266625086466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,4,power_law_1.01,0.147871994972229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,4,power_law_1.01,0.1615231990814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,4,power_law_1.2,0.1804479956626892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,4,power_law_1.2,0.20972158908843994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,8,balanced,0.14881599942843118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,8,balanced,0.1516320010026296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,8,power_law_1.01,0.14962559938430786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,8,power_law_1.01,0.14992640018463135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,8,power_law_1.2,0.1476415991783142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,1,8,power_law_1.2,0.14793599843978883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,16,1,balanced,0.03551466763019562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,16,1,balanced,0.03566399961709976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,16,1,power_law_1.01,0.03866879940032959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,16,1,power_law_1.01,0.038867199420928956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,16,1,power_law_1.2,0.03824639916419983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,16,1,power_law_1.2,0.03888640105724335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,2,1,balanced,0.1316480040550232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,2,1,balanced,0.15229866902033487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,2,1,power_law_1.01,0.12669440507888793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,2,1,power_law_1.01,0.14256639480590821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,2,1,power_law_1.2,0.13006720542907715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,2,1,power_law_1.2,0.14742399454116822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,32,1,balanced,0.0332640012105306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,32,1,balanced,0.03339733431736628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,32,1,power_law_1.01,0.03188480138778686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,32,1,power_law_1.01,0.03221760094165802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,32,1,power_law_1.2,0.03304960131645203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,32,1,power_law_1.2,0.03311359882354736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,4,1,balanced,0.06946666538715363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,4,1,balanced,0.07746666669845581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,4,1,power_law_1.01,0.06743680238723755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,4,1,power_law_1.01,0.06780160069465638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,4,1,power_law_1.2,0.073580801486969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,4,1,power_law_1.2,0.07482879757881164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,8,1,balanced,0.048298666874567665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,8,1,balanced,0.05609600245952606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,8,1,power_law_1.01,0.046777600049972536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,8,1,power_law_1.01,0.04699519872665405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,8,1,power_law_1.2,0.050361597537994386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,16384,2,8,8,1,power_law_1.2,0.05375360250473023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,1,balanced,0.12849600116411844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,1,balanced,0.1451573371887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,1,power_law_1.01,0.12805119752883912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,1,power_law_1.01,0.12940800189971924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,1,power_law_1.2,0.125491201877594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,1,power_law_1.2,0.12816640138626098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,128,balanced,0.04187199970086416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,128,balanced,0.042021334171295166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,128,power_law_1.01,0.058822399377822875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,128,power_law_1.01,0.05894399881362915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,128,power_law_1.2,0.058195197582244874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,128,power_law_1.2,0.058380800485610965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,16,balanced,0.04342933495839437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,16,balanced,0.04374399781227112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,16,power_law_1.01,0.13017599582672118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,16,power_law_1.01,0.13033599853515626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,16,power_law_1.2,0.1310528039932251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,16,power_law_1.2,0.1314560055732727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,2,balanced,0.07669866581757863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,2,balanced,0.07744533320267995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,2,power_law_1.01,0.1315775990486145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,2,power_law_1.01,0.13315199613571166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,2,power_law_1.2,0.12928639650344848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,2,power_law_1.2,0.13251199722290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,256,balanced,0.04340800146261851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,256,balanced,0.04372799893220266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,256,power_law_1.01,0.040601599216461184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,256,power_law_1.01,0.04119040071964264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,256,power_law_1.2,0.04058879911899567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,256,power_law_1.2,0.040863999724388124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,32,balanced,0.04374399781227112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,32,balanced,0.04377600053946177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,32,power_law_1.01,0.1304255962371826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,32,power_law_1.01,0.1323583960533142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,32,power_law_1.2,0.128601598739624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,32,power_law_1.2,0.13080320358276368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,4,balanced,0.06071466704209646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,4,balanced,0.06126933296521505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,4,power_law_1.01,0.12865279912948607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,4,power_law_1.01,0.13351039886474608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,4,power_law_1.2,0.1307711958885193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,4,power_law_1.2,0.13426560163497925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,64,balanced,0.043935999274253845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,64,balanced,0.04562666515509287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,64,power_law_1.01,0.07388160228729249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,64,power_law_1.01,0.07489280104637146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,64,power_law_1.2,0.0737600028514862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,64,power_law_1.2,0.07516160011291503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,8,balanced,0.04154133299986521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,8,balanced,0.04292266567548116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,8,power_law_1.01,0.13299200534820557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,8,power_law_1.01,0.1331455945968628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,8,power_law_1.2,0.127948796749115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,1,8,power_law_1.2,0.1305791974067688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,16,1,balanced,0.03554133325815201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,16,1,balanced,0.03620799879233042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,16,1,power_law_1.01,0.03333120048046112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,16,1,power_law_1.01,0.03364480137825012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,16,1,power_law_1.2,0.033606401085853575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,16,1,power_law_1.2,0.03386240005493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,2,1,balanced,0.06925333539644878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,2,1,balanced,0.07020266850789388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,2,1,power_law_1.01,0.07095680236816407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,2,1,power_law_1.01,0.07616000175476074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,2,1,power_law_1.2,0.06696959733963012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,2,1,power_law_1.2,0.06838399767875672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,32,1,balanced,0.03350933392842611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,32,1,balanced,0.03538133452335993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,32,1,power_law_1.01,0.03288320004940033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,32,1,power_law_1.01,0.03335039913654327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,32,1,power_law_1.2,0.03283199965953827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,32,1,power_law_1.2,0.03317759931087494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,4,1,balanced,0.04869333406289419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,4,1,balanced,0.049957334995269775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,4,1,power_law_1.01,0.04894720017910004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,4,1,power_law_1.01,0.054502397775650024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,4,1,power_law_1.2,0.04784640073776245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,4,1,power_law_1.2,0.04945279955863953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,8,1,balanced,0.0394400010506312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,8,1,balanced,0.03968533376852671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,8,1,power_law_1.01,0.03559040129184723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,8,1,power_law_1.01,0.038553598523139956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,8,1,power_law_1.2,0.03513599932193756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2048,8,256,8,1,power_law_1.2,0.035308799147605895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,1,balanced,0.13952533404032388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,1,balanced,0.13985066612561545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,1,power_law_1.01,0.1384703993797302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,1,power_law_1.01,0.13992320299148558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,1,power_law_1.2,0.13759360313415528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,1,power_law_1.2,0.1480512022972107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,16,balanced,0.04587199787298838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,16,balanced,0.04791999856630961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,16,power_law_1.01,0.1438655972480774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,16,power_law_1.01,0.1445248007774353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,16,power_law_1.2,0.14495359659194945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,16,power_law_1.2,0.1450816035270691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,2,balanced,0.08553600311279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,2,balanced,0.08665066957473755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,2,power_law_1.01,0.1441215991973877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,2,power_law_1.01,0.14793599843978883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,2,power_law_1.2,0.14508800506591796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,2,power_law_1.2,0.15219839811325073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,32,balanced,0.047600001096725464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,32,balanced,0.04969066878159841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,32,power_law_1.01,0.10362880229949951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,32,power_law_1.01,0.10404479503631592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,32,power_law_1.2,0.10232959985733033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,32,power_law_1.2,0.1030784010887146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,4,balanced,0.0624533345301946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,4,balanced,0.06379733482996623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,4,power_law_1.01,0.14384640455245973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,4,power_law_1.01,0.14570879936218262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,4,power_law_1.2,0.14416639804840087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,4,power_law_1.2,0.15016959905624389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,8,balanced,0.0476746658484141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,8,balanced,0.04784533381462097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,8,power_law_1.01,0.14470399618148805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,8,power_law_1.01,0.14534399509429932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,8,power_law_1.2,0.14435839653015137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,1,8,power_law_1.2,0.14574079513549804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,16,1,balanced,0.03737066686153412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,16,1,balanced,0.03761066744724909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,16,1,power_law_1.01,0.035206401348114015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,16,1,power_law_1.01,0.035257598757743834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,16,1,power_law_1.2,0.03516800105571747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,16,1,power_law_1.2,0.0354559987783432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,2,1,balanced,0.07865599791208903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,2,1,balanced,0.08041066428025563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,2,1,power_law_1.01,0.07764480113983155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,2,1,power_law_1.01,0.09258239865303039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,2,1,power_law_1.2,0.08112639784812928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,2,1,power_law_1.2,0.08663679957389832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,32,1,balanced,0.035455999275048576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,32,1,balanced,0.03561066587766012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,32,1,power_law_1.01,0.0332863986492157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,32,1,power_law_1.01,0.03361279964447021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,32,1,power_law_1.2,0.03318400084972382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,32,1,power_law_1.2,0.033529600501060484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,4,1,balanced,0.05909866591294607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,4,1,balanced,0.06306133170922597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,4,1,power_law_1.01,0.05449600219726562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,4,1,power_law_1.01,0.054681599140167236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,4,1,power_law_1.2,0.0538752019405365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,4,1,power_law_1.2,0.05633919835090637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,8,1,balanced,0.04142399877309799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,8,1,balanced,0.04159466673930486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,8,1,power_law_1.01,0.04007680118083954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,8,1,power_law_1.01,0.040729600191116336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,8,1,power_law_1.2,0.044972801208496095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,6144,2560,8,160,8,1,power_law_1.2,0.045311999320983884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,1,balanced,0.1418239971001943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,1,balanced,0.14850667119026184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,1,power_law_1.01,0.1442752003669739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,1,power_law_1.01,0.14526720046997071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,1,power_law_1.2,0.14309120178222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,1,power_law_1.2,0.1458624005317688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,128,balanced,0.048767998814582825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,128,balanced,0.05407999952634176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,128,power_law_1.01,0.06232960224151611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,128,power_law_1.01,0.06276479959487916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,128,power_law_1.2,0.06232320070266724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,128,power_law_1.2,0.06270080208778381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,16,balanced,0.0480373352766037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,16,balanced,0.05163733164469401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,16,power_law_1.01,0.14988160133361816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,16,power_law_1.01,0.15133440494537354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,16,power_law_1.2,0.15441919565200807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,16,power_law_1.2,0.15556479692459108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,2,balanced,0.08823466300964355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,2,balanced,0.0902239978313446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,2,power_law_1.01,0.15111680030822755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,2,power_law_1.01,0.15324800014495848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,2,power_law_1.2,0.15199999809265136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,2,power_law_1.2,0.1522304058074951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,256,balanced,0.051642666260401406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,256,balanced,0.056128000219662987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,256,power_law_1.01,0.04855040013790131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,256,power_law_1.01,0.048767998814582825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,256,power_law_1.2,0.04883840084075928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,256,power_law_1.2,0.049830400943756105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,32,balanced,0.051925331354141235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,32,balanced,0.052095999320348106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,32,power_law_1.01,0.15234559774398804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,32,power_law_1.01,0.15247360467910767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,32,power_law_1.2,0.15267200469970704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,32,power_law_1.2,0.15418239831924438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,4,balanced,0.06381866832574208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,4,balanced,0.06623466809590657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,4,power_law_1.01,0.15320320129394532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,4,power_law_1.01,0.15493119955062867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,4,power_law_1.2,0.15523840188980104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,4,power_law_1.2,0.1586303949356079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,64,balanced,0.05374933282534281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,64,balanced,0.053946668903032936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,64,power_law_1.01,0.08654080033302307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,64,power_law_1.01,0.08764799833297729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,64,power_law_1.2,0.08698239922523499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,64,power_law_1.2,0.08830080032348633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,8,balanced,0.04994133114814758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,8,balanced,0.059861332178115845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,8,power_law_1.01,0.14965120553970337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,8,power_law_1.01,0.1527168035507202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,8,power_law_1.2,0.15032960176467897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,1,8,power_law_1.2,0.15550719499588012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,16,1,balanced,0.03972800076007843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,16,1,balanced,0.03977066775163015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,16,1,power_law_1.01,0.03777279853820801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,16,1,power_law_1.01,0.03809280097484589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,16,1,power_law_1.2,0.03777279853820801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,16,1,power_law_1.2,0.03793280124664307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,2,1,balanced,0.07711466650168101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,2,1,balanced,0.08261866867542267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,2,1,power_law_1.01,0.08783360123634339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,2,1,power_law_1.01,0.08946560025215149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,2,1,power_law_1.2,0.07602559924125671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,2,1,power_law_1.2,0.07864959836006165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,32,1,balanced,0.038362666964530945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,32,1,balanced,0.03976000100374222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,32,1,power_law_1.01,0.03701759874820709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,32,1,power_law_1.01,0.03720319867134094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,32,1,power_law_1.2,0.037599998712539676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,32,1,power_law_1.2,0.03763200044631958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,4,1,balanced,0.05608533322811127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,4,1,balanced,0.059119999408721924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,4,1,power_law_1.01,0.05379840135574341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,4,1,power_law_1.01,0.054201602935791016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,4,1,power_law_1.2,0.05445759892463684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,4,1,power_law_1.2,0.055302399396896365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,8,1,balanced,0.044480000933011375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,8,1,balanced,0.04548266530036926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,8,1,power_law_1.01,0.048441600799560544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,8,1,power_law_1.01,0.05025920271873474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,8,1,power_law_1.2,0.04224640130996704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,256,8,1,power_law_1.2,0.04430719912052154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,1,balanced,0.14346667130788168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,1,balanced,0.14892266194025675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,1,power_law_1.01,0.1447424054145813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,1,power_law_1.01,0.14476159811019898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,1,power_law_1.2,0.14549119472503663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,1,power_law_1.2,0.14595199823379518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,128,balanced,0.04981866478919983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,128,balanced,0.05189333359400431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,128,power_law_1.01,0.0688704013824463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,128,power_law_1.01,0.06903679966926575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,128,power_law_1.2,0.0681984007358551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,128,power_law_1.2,0.06910719871520996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,16,balanced,0.04923200110594431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,16,balanced,0.050101334849993386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,16,power_law_1.01,0.15084160566329957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,16,power_law_1.01,0.15349119901657104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,16,power_law_1.2,0.14988160133361816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,16,power_law_1.2,0.15263359546661376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,2,balanced,0.09120532870292664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,2,balanced,0.10539199908574422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,2,power_law_1.01,0.15215359926223754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,2,power_law_1.01,0.16325119733810425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,2,power_law_1.2,0.15430400371551514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,2,power_law_1.2,0.15828479528427125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,32,balanced,0.049813335140546165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,32,balanced,0.05165866514046987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,32,power_law_1.01,0.15371520519256593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,32,power_law_1.01,0.15594880580902098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,32,power_law_1.2,0.15287040472030639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,32,power_law_1.2,0.15400320291519165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,4,balanced,0.06437333424886067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,4,balanced,0.06549866497516632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,4,power_law_1.01,0.15360000133514404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,4,power_law_1.01,0.1559231996536255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,4,power_law_1.2,0.14739199876785278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,4,power_law_1.2,0.15348479747772217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,64,balanced,0.049925332268079124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,64,balanced,0.051872000098228455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,64,power_law_1.01,0.1071679949760437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,64,power_law_1.01,0.10730240345001221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,64,power_law_1.2,0.10656640529632569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,64,power_law_1.2,0.10699520111083985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,8,balanced,0.05000533163547516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,8,balanced,0.052000001072883606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,8,power_law_1.01,0.15274239778518678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,8,power_law_1.01,0.15441279411315917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,8,power_law_1.2,0.149017596244812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,1,8,power_law_1.2,0.15202560424804687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,16,1,balanced,0.03948266555865606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,16,1,balanced,0.039647998909155525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,16,1,power_law_1.01,0.03733119964599609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,16,1,power_law_1.01,0.03751679956912994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,16,1,power_law_1.2,0.03726080060005188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,16,1,power_law_1.2,0.03805440068244934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,2,1,balanced,0.07750933369000752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,2,1,balanced,0.07795199751853943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,2,1,power_law_1.01,0.07581440210342408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,2,1,power_law_1.01,0.07679359912872315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,2,1,power_law_1.2,0.0753216028213501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,2,1,power_law_1.2,0.07623680233955384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,32,1,balanced,0.03807999938726425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,32,1,balanced,0.03949866692225138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,32,1,power_law_1.01,0.037190398573875426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,32,1,power_law_1.01,0.03740800023078918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,32,1,power_law_1.2,0.037049600481987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,32,1,power_law_1.2,0.03768320083618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,4,1,balanced,0.05414933462937673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,4,1,balanced,0.06117866436640421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,4,1,power_law_1.01,0.05319679975509643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,4,1,power_law_1.01,0.053958398103713986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,4,1,power_law_1.2,0.054048001766204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,4,1,power_law_1.2,0.0541055977344513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,8,1,balanced,0.04493333399295807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,8,1,balanced,0.04563733438650767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,8,1,power_law_1.01,0.042796799540519716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,8,1,power_law_1.01,0.043270400166511534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,8,1,power_law_1.2,0.0416703999042511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1,7168,2048,8,384,8,1,power_law_1.2,0.042368000745773314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,1,balanced,0.2694026629130046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,1,balanced,0.2704319953918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,1,power_law_1.01,0.3056895971298218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,1,power_law_1.01,0.3083264112472534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,1,power_law_1.2,0.3176127910614014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,1,power_law_1.2,0.3185920000076294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,128,balanced,0.0807360013326009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,128,balanced,0.08291199803352356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,128,power_law_1.01,0.08330240249633789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,128,power_law_1.01,0.08432000279426574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,128,power_law_1.2,0.08488320112228394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,128,power_law_1.2,0.08814719915390015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,16,balanced,0.09894933303197224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,16,balanced,0.10011200110117595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,16,power_law_1.01,0.1012992024421692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,16,power_law_1.01,0.10188159942626954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,16,power_law_1.2,0.10582400560379028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,16,power_law_1.2,0.10606080293655396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,2,balanced,0.20213866233825684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,2,balanced,0.2055199940999349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,2,power_law_1.01,0.22339200973510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,2,power_law_1.01,0.22373759746551514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,2,power_law_1.2,0.2265984058380127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,2,power_law_1.2,0.2278143882751465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,32,balanced,0.09353599945704143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,32,balanced,0.09515733520189922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,32,power_law_1.01,0.09411839842796325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,32,power_law_1.01,0.09505280256271362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,32,power_law_1.2,0.09552639722824097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,32,power_law_1.2,0.09623680114746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,4,balanced,0.1465173363685608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,4,balanced,0.14756266276041666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,4,power_law_1.01,0.15466879606246947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,4,power_law_1.01,0.15602560043334962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,4,power_law_1.2,0.16049280166625976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,4,power_law_1.2,0.16085120439529418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,64,balanced,0.0841919978459676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,64,balanced,0.0848640004793803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,64,power_law_1.01,0.0871295988559723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,64,power_law_1.01,0.08798720240592957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,64,power_law_1.2,0.09070720076560974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,64,power_law_1.2,0.09141759872436524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,8,balanced,0.1111306647459666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,8,balanced,0.1116480032602946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,8,power_law_1.01,0.12443519830703735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,8,power_law_1.01,0.1279680013656616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,8,power_law_1.2,0.12688640356063843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,1,8,power_law_1.2,0.12773120403289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,2,1,balanced,0.18900799751281738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,2,1,balanced,0.19086933135986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,2,1,power_law_1.01,0.21000959873199462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,2,1,power_law_1.01,0.21011199951171874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,2,1,power_law_1.2,0.21346559524536132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,2,1,power_law_1.2,0.2149951934814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,4,1,balanced,0.1387999951839447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,4,1,balanced,0.1401653289794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,4,1,power_law_1.01,0.14510719776153563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,4,1,power_law_1.01,0.14645760059356688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,4,1,power_law_1.2,0.14727040529251098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2048,768,8,128,4,1,power_law_1.2,0.1475775957107544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,1,balanced,0.6976213455200195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,1,balanced,0.7044106324513754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,1,power_law_1.01,0.7702847957611084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,1,power_law_1.01,0.7769216060638428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,1,power_law_1.2,0.7931392192840576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,1,power_law_1.2,0.7981056213378906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,128,balanced,0.11373333136240642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,128,balanced,0.1151626706123352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,128,power_law_1.01,0.11776000261306763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,128,power_law_1.01,0.11912319660186768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,128,power_law_1.2,0.12290560007095337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,128,power_law_1.2,0.12364799976348877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,16,balanced,0.15224533279736838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,16,balanced,0.152319997549057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,16,power_law_1.01,0.16325759887695312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,16,power_law_1.01,0.16811519861221313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,16,power_law_1.2,0.17082879543304444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,16,power_law_1.2,0.1728320002555847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,2,balanced,0.45767998695373535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,2,balanced,0.45826133092244464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,2,power_law_1.01,0.475219202041626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,2,power_law_1.01,0.4854400157928467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,2,power_law_1.2,0.4742720127105713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,2,power_law_1.2,0.5042880058288575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,32,balanced,0.12737066547075906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,32,balanced,0.1276639997959137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,32,power_law_1.01,0.13614720106124878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,32,power_law_1.01,0.13787519931793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,32,power_law_1.2,0.14521600008010865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,32,power_law_1.2,0.14997119903564454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,4,balanced,0.29130132993062335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,4,balanced,0.29171733061472577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,4,power_law_1.01,0.30543999671936034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,4,power_law_1.01,0.3068288087844849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,4,power_law_1.2,0.32039039134979247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,4,power_law_1.2,0.32520959377288816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,64,balanced,0.1172160009543101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,64,balanced,0.11734933654467265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,64,power_law_1.01,0.1242751955986023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,64,power_law_1.01,0.12444800138473511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,64,power_law_1.2,0.128985595703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,64,power_law_1.2,0.12920960187911987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,8,balanced,0.20172800620396933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,8,balanced,0.20220800240834555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,8,power_law_1.01,0.21350400447845458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,8,power_law_1.01,0.22156798839569092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,8,power_law_1.2,0.22003839015960694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,1,8,power_law_1.2,0.22189440727233886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,16,1,balanced,0.2775626579920451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,16,1,balanced,0.277893324693044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,16,1,power_law_1.01,0.2956928014755249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,16,1,power_law_1.01,0.3006975889205933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,16,1,power_law_1.2,0.3281791925430298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,16,1,power_law_1.2,0.32965118885040284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,2,1,balanced,0.44544533888498944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,2,1,balanced,0.44648532072703045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,2,1,power_law_1.01,0.4654719829559326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,2,1,power_law_1.01,0.4662784099578857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,2,1,power_law_1.2,0.4737919807434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,2,1,power_law_1.2,0.4784639835357666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,32,1,balanced,0.22527466217676798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,32,1,balanced,0.22553600867589316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,32,1,power_law_1.01,0.2466048002243042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,32,1,power_law_1.01,0.2478015899658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,32,1,power_law_1.2,0.2680576086044312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,32,1,power_law_1.2,0.2736768007278442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,4,1,balanced,0.2748960057894389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,4,1,balanced,0.27509866158167523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,4,1,power_law_1.01,0.2833983898162842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,4,1,power_law_1.01,0.28444159030914307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,4,1,power_law_1.2,0.2958463907241821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,4,1,power_law_1.2,0.3007040023803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,8,1,balanced,0.36211200555165607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,8,1,balanced,0.3628213405609131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,8,1,power_law_1.01,0.40170879364013673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,8,1,power_law_1.01,0.40633602142333985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,8,1,power_law_1.2,0.40508160591125486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,2688,1856,6,128,8,1,power_law_1.2,0.4084479808807373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,1,balanced,1.406069278717041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,1,balanced,1.4525119463602703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,1,power_law_1.01,1.3688128471374512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,1,power_law_1.01,1.3690560340881348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,1,power_law_1.2,1.4099007606506349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,1,power_law_1.2,1.4329919815063477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,128,balanced,0.15633066495259604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,128,balanced,0.15782933433850607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,128,power_law_1.01,0.15920000076293944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,128,power_law_1.01,0.16113920211791993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,128,power_law_1.2,0.1630784034729004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,128,power_law_1.2,0.16352640390396117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,16,balanced,0.23460266987482706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,16,balanced,0.23493333657582602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,16,power_law_1.01,0.23648641109466553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,16,power_law_1.01,0.24031999111175537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,16,power_law_1.2,0.24642560482025147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,16,power_law_1.2,0.24649600982666015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,2,balanced,0.7895840009053549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,2,balanced,0.7904213269551595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,2,power_law_1.01,0.7560383796691894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,2,power_law_1.01,0.7721983909606933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,2,power_law_1.2,0.7980991840362549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,2,power_law_1.2,0.809721565246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,256,balanced,0.1523253321647644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,256,balanced,0.15405866503715515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,256,power_law_1.01,0.15354880094528198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,256,power_law_1.01,0.15539200305938722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,256,power_law_1.2,0.1575551986694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,256,power_law_1.2,0.1586624026298523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,32,balanced,0.19083199898401895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,32,balanced,0.19092265764872232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,32,power_law_1.01,0.19664640426635743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,32,power_law_1.01,0.19839359521865846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,32,power_law_1.2,0.20638079643249513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,32,power_law_1.2,0.21012480258941652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,4,balanced,0.47926398118336994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,4,balanced,0.4792960087458293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,4,power_law_1.01,0.47223677635192873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,4,power_law_1.01,0.4723328113555908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,4,power_law_1.2,0.4794367790222168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,4,power_law_1.2,0.49120001792907714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,64,balanced,0.1662773291269938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,64,balanced,0.16660267114639282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,64,power_law_1.01,0.17070080041885377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,64,power_law_1.01,0.17181440591812133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,64,power_law_1.2,0.1741696000099182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,64,power_law_1.2,0.17794560194015502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,8,balanced,0.3141653339068095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,8,balanced,0.3157599965731303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,8,power_law_1.01,0.3144256114959717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,8,power_law_1.01,0.32272000312805177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,8,power_law_1.2,0.33018879890441893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,1,8,power_law_1.2,0.335263991355896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,16,1,balanced,0.23422932624816895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,16,1,balanced,0.23435733715693155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,16,1,power_law_1.01,0.23082239627838136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,16,1,power_law_1.01,0.23136000633239745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,16,1,power_law_1.2,0.2371135950088501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,16,1,power_law_1.2,0.23751039505004884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,2,1,balanced,0.7702506383260092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,2,1,balanced,0.7722133000691732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,2,1,power_law_1.01,0.7478655815124512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,2,1,power_law_1.01,0.748307180404663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,2,1,power_law_1.2,0.7811840057373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,2,1,power_law_1.2,0.7835775852203369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,32,1,balanced,0.18523732821146646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,32,1,balanced,0.18540799617767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,32,1,power_law_1.01,0.1859328031539917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,32,1,power_law_1.01,0.18707200288772582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,32,1,power_law_1.2,0.18880640268325805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,32,1,power_law_1.2,0.1889855980873108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,4,1,balanced,0.45774932702382404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,4,1,balanced,0.45846935113271076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,4,1,power_law_1.01,0.4460288047790527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,4,1,power_law_1.01,0.44999041557312014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,4,1,power_law_1.2,0.45819520950317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,4,1,power_law_1.2,0.4597760200500488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,8,1,balanced,0.2956533432006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,8,1,balanced,0.29703466097513836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,8,1,power_law_1.01,0.29164800643920896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,8,1,power_law_1.01,0.2918976068496704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,8,1,power_law_1.2,0.2974208116531372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,3072,1536,8,256,8,1,power_law_1.2,0.30122239589691163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,1,balanced,1.0535679658253987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,1,balanced,1.0610026518503826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,1,power_law_1.01,1.3446080207824707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,1,power_law_1.01,1.3496831893920898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,1,power_law_1.2,1.3323840141296386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,1,power_law_1.2,1.3478591918945313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,2,balanced,0.5526826779047648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,2,balanced,0.5537439982096354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,2,power_law_1.01,0.7640768051147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,2,power_law_1.01,0.7929088115692139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,2,power_law_1.2,0.8022975921630859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,2,power_law_1.2,0.8168831825256347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,4,balanced,0.3949173291524251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,4,balanced,0.39708268642425537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,4,power_law_1.01,0.5814847946166992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,4,power_law_1.01,0.6357120037078857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,4,power_law_1.2,0.5449664115905761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,4,power_law_1.2,0.5769408226013184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,8,balanced,0.3205440044403076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,8,balanced,0.32434133688608807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,8,power_law_1.01,0.4614399909973145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,8,power_law_1.01,0.46670079231262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,8,power_law_1.2,0.4799232006072998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,1,8,power_law_1.2,0.4801472187042236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,16,1,balanced,0.1006666620572408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,16,1,balanced,0.10113599896430969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,16,1,power_law_1.01,0.11260160207748413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,16,1,power_law_1.01,0.11535359621047973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,16,1,power_law_1.2,0.10853760242462158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,16,1,power_law_1.2,0.11904640197753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,2,1,balanced,0.5247893333435059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,2,1,balanced,0.5290773312250773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,2,1,power_law_1.01,0.6252927780151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,2,1,power_law_1.01,0.62773118019104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,2,1,power_law_1.2,0.6293759822845459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,2,1,power_law_1.2,0.6304512023925781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,32,1,balanced,0.08450667063395183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,32,1,balanced,0.0846453309059143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,32,1,power_law_1.01,0.0900160014629364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,32,1,power_law_1.01,0.09148160219192505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,32,1,power_law_1.2,0.08932480216026306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,32,1,power_law_1.2,0.09176959991455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,4,1,balanced,0.28574933608373004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,4,1,balanced,0.2871146599451701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,4,1,power_law_1.01,0.32060799598693845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,4,1,power_law_1.01,0.3207808017730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,4,1,power_law_1.2,0.32194559574127196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,4,1,power_law_1.2,0.3281599998474121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,8,1,balanced,0.1634773313999176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,8,1,balanced,0.1641279955705007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,8,1,power_law_1.01,0.18291200399398805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,8,1,power_law_1.01,0.18970240354537965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,8,1,power_law_1.2,0.17756799459457398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,14336,2,8,8,1,power_law_1.2,0.17770240306854249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,1,balanced,0.986016035079956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,1,balanced,0.9917706648508707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,1,power_law_1.01,1.0911040306091309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,1,power_law_1.01,1.123020839691162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,1,power_law_1.2,1.126028823852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,1,power_law_1.2,1.1289664268493653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,128,balanced,0.15093866984049478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,128,balanced,0.1511626640955607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,128,power_law_1.01,0.15387519598007202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,128,power_law_1.01,0.15411200523376464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,128,power_law_1.2,0.15896960496902465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,128,power_law_1.2,0.1606592059135437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,16,balanced,0.18954666455586752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,16,balanced,0.1904533306757609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,16,power_law_1.01,0.2184448003768921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,16,power_law_1.01,0.2190783977508545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,16,power_law_1.2,0.22639360427856445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,16,power_law_1.2,0.2298367977142334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,2,balanced,0.5833973487218221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,2,balanced,0.5849013328552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,2,power_law_1.01,0.6343039989471435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,2,power_law_1.01,0.6476799964904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,2,power_law_1.2,0.6510591983795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,2,power_law_1.2,0.6678080081939697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,32,balanced,0.166293332974116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,32,balanced,0.16642133394877115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,32,power_law_1.01,0.1813696026802063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,32,power_law_1.01,0.18190079927444458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,32,power_law_1.2,0.19507839679718017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,32,power_law_1.2,0.1956287980079651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,4,balanced,0.35492265224456787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,4,balanced,0.35497065385182697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,4,power_law_1.01,0.39518721103668214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,4,power_law_1.01,0.3978048086166382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,4,power_law_1.2,0.39886720180511476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,4,power_law_1.2,0.4197887897491455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,64,balanced,0.1556000014146169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,64,balanced,0.15652267138163248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,64,power_law_1.01,0.16391680240631104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,64,power_law_1.01,0.16447360515594484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,64,power_law_1.2,0.16684800386428833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,64,power_law_1.2,0.17196799516677858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,8,balanced,0.25490132967631024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,8,balanced,0.25521065791447956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,8,power_law_1.01,0.28657920360565187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,8,power_law_1.01,0.2888128042221069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,8,power_law_1.2,0.29231359958648684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,1,8,power_law_1.2,0.30399360656738283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,16,1,balanced,0.18664000431696573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,16,1,balanced,0.18851200739542642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,16,1,power_law_1.01,0.22415359020233155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,16,1,power_law_1.01,0.22620160579681398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,16,1,power_law_1.2,0.22607998847961425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,16,1,power_law_1.2,0.22822399139404298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,2,1,balanced,0.49169600009918213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,2,1,balanced,0.49593067169189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,2,1,power_law_1.01,0.5630720138549805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,2,1,power_law_1.01,0.5647103786468506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,2,1,power_law_1.2,0.5841856002807617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,2,1,power_law_1.2,0.5862336158752441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,32,1,balanced,0.16828266779581705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,32,1,balanced,0.16846932967503866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,32,1,power_law_1.01,0.17812479734420777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,32,1,power_law_1.01,0.17893760204315184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,32,1,power_law_1.2,0.17982079982757568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,32,1,power_law_1.2,0.18157440423965454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,4,1,balanced,0.33373332023620605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,4,1,balanced,0.3349226713180542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,4,1,power_law_1.01,0.3730751991271973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,4,1,power_law_1.01,0.3779072046279907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,4,1,power_law_1.2,0.38304638862609863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,8,1,balanced,0.24406933784484863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,8,1,balanced,0.2477653423945109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,8,1,power_law_1.01,0.2549504041671753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,8,1,power_law_1.01,0.25623040199279784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,8,1,power_law_1.2,0.25734400749206543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,1536,8,128,8,1,power_law_1.2,0.2594815969467163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,1,balanced,6.71779187520345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,1,balanced,6.853061040242513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,1,power_law_1.01,6.855039978027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,1,power_law_1.01,7.071046447753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,1,power_law_1.2,7.38897933959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,1,power_law_1.2,7.438201904296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,128,balanced,0.5369919935862223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,128,balanced,0.5373066663742065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,128,power_law_1.01,0.5669568061828614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,128,power_law_1.01,0.572160005569458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,128,power_law_1.2,0.5822207927703857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,128,power_law_1.2,0.5822847843170166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,16,balanced,0.8640426794687907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,16,balanced,0.8642346858978271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,16,power_law_1.01,0.9203455924987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,16,power_law_1.01,0.923737621307373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,16,power_law_1.2,0.918284797668457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,16,power_law_1.2,0.9409152030944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,2,balanced,3.5209118525187173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,2,balanced,3.6346559524536133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,2,power_law_1.01,3.761740875244141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,2,power_law_1.01,3.763616180419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,2,power_law_1.2,3.7516414642333986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,2,power_law_1.2,3.8921409606933595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,256,balanced,0.5180960098902384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,256,balanced,0.5186026493708292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,256,power_law_1.01,0.5370368003845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,256,power_law_1.01,0.5398848056793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,256,power_law_1.2,0.552294397354126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,256,power_law_1.2,0.5525760173797607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,32,balanced,0.6846240361531576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,32,balanced,0.6850132942199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,32,power_law_1.01,0.7230527877807618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,32,power_law_1.01,0.7270207881927491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,32,power_law_1.2,0.7330687999725342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,32,power_law_1.2,0.7359295845031738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,4,balanced,1.9720746676127117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,4,balanced,2.0149973233540854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,4,power_law_1.01,2.027091217041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,4,power_law_1.01,2.0792640686035155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,4,power_law_1.2,2.0726911544799806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,4,power_law_1.2,2.1518527984619142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,64,balanced,0.5946133136749268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,64,balanced,0.5952479839324951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,64,power_law_1.01,0.6162943840026855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,64,power_law_1.01,0.6194431781768799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,64,power_law_1.2,0.6395391941070556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,64,power_law_1.2,0.6415808200836182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,8,balanced,1.238810698191325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,8,balanced,1.2396639982859294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,8,power_law_1.01,1.290272045135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,8,power_law_1.01,1.2948351860046388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,8,power_law_1.2,1.3198207855224608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,1,8,power_law_1.2,1.3239616394042968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,16,1,balanced,1.6878132820129395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,16,1,balanced,1.6893760363260906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,16,1,power_law_1.01,1.7863807678222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,16,1,power_law_1.01,1.8131263732910157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,16,1,power_law_1.2,1.8493759155273437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,16,1,power_law_1.2,1.871552085876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,2,1,balanced,2.943690617879232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,2,1,balanced,2.9610398610432944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,2,1,power_law_1.01,3.238259124755859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,2,1,power_law_1.01,3.244780731201172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,2,1,power_law_1.2,3.371263885498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,2,1,power_law_1.2,3.471750259399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,32,1,balanced,1.4320799509684246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,32,1,balanced,1.4325920740763347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,32,1,power_law_1.01,1.5442048072814942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,32,1,power_law_1.01,1.5544447898864746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,32,1,power_law_1.2,1.6043712615966796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,32,1,power_law_1.2,1.6237247467041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,4,1,balanced,2.5595199267069497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,4,1,balanced,2.559685389200846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,4,1,power_law_1.01,2.7194623947143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,4,1,power_law_1.01,2.7367359161376954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,4,1,power_law_1.2,2.7662847518920897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,4,1,power_law_1.2,2.7753856658935545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,8,1,balanced,1.1154826482137044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,8,1,balanced,1.1173226833343506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,8,1,power_law_1.01,1.1650239944458007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,8,1,power_law_1.01,1.1721983909606934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,8,1,power_law_1.2,1.2032320022583007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,4096,2688,22,512,8,1,power_law_1.2,1.2221695899963378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,1,balanced,1.8121333122253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,1,balanced,1.8482666015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,1,power_law_1.01,2.2899263381958006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,1,power_law_1.01,2.4390655517578126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,1,power_law_1.2,2.2565183639526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,1,power_law_1.2,2.260268783569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,2,balanced,0.906165361404419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,2,balanced,0.908618688583374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,2,power_law_1.01,1.2125632286071777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,2,power_law_1.01,1.2617088317871095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,2,power_law_1.2,1.175046443939209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,2,power_law_1.2,1.2399680137634277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,4,balanced,0.530351996421814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,4,balanced,0.5314293305079142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,4,power_law_1.01,0.9038975715637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,4,power_law_1.01,0.9102272033691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,4,power_law_1.2,0.8965375900268555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,4,power_law_1.2,0.952518367767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,8,balanced,0.4023733139038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,8,balanced,0.4029386838277181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,8,power_law_1.01,0.738099193572998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,8,power_law_1.01,0.7742080211639404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,8,power_law_1.2,0.6833727836608887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,1,8,power_law_1.2,0.7235712051391602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,16,1,balanced,0.14131733775138855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,16,1,balanced,0.1430346667766571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,16,1,power_law_1.01,0.19197440147399902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,16,1,power_law_1.01,0.1960576057434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,16,1,power_law_1.2,0.19368319511413573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,16,1,power_law_1.2,0.1953984022140503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,2,1,balanced,0.8389279842376709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,2,1,balanced,0.8449866771697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,2,1,power_law_1.01,1.0400832176208497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,2,1,power_law_1.01,1.0456512451171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,2,1,power_law_1.2,1.0285632133483886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,2,1,power_law_1.2,1.0380543708801269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,32,1,balanced,0.11718933780988057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,32,1,balanced,0.11749333143234253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,32,1,power_law_1.01,0.1276800036430359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,32,1,power_law_1.01,0.12986880540847778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,32,1,power_law_1.2,0.12737280130386353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,32,1,power_law_1.2,0.13007359504699706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,4,1,balanced,0.43792001406351727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,4,1,balanced,0.4478986660639445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,4,1,power_law_1.01,0.5178688049316407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,4,1,power_law_1.01,0.5256447792053223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,4,1,power_law_1.2,0.5239999771118165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,4,1,power_law_1.2,0.5319808006286622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,8,1,balanced,0.23788267374038696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,8,1,balanced,0.23922133445739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,8,1,power_law_1.01,0.2961087942123413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,8,1,power_law_1.01,0.29624960422515867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,8,1,power_law_1.2,0.29305601119995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,16384,2,8,8,1,power_law_1.2,0.2946943998336792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,1,balanced,3.702922821044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,1,balanced,3.804880142211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,1,power_law_1.01,3.6153537750244142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,1,power_law_1.01,3.66308479309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,1,power_law_1.2,3.6064193725585936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,1,power_law_1.2,3.800511932373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,128,balanced,0.2589973409970601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,128,balanced,0.2595840096473694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,128,power_law_1.01,0.27171199321746825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,128,power_law_1.01,0.27308800220489504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,128,power_law_1.2,0.27876479625701905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,128,power_law_1.2,0.28382720947265627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,16,balanced,0.44488000869750977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,16,balanced,0.4461173216501872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,16,power_law_1.01,0.45246081352233886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,16,power_law_1.01,0.4668032169342041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,16,power_law_1.2,0.47518720626831057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,16,power_law_1.2,0.47873921394348146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,2,balanced,1.9170133272806804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,2,balanced,2.0043253898620605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,2,power_law_1.01,1.8871423721313476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,2,power_law_1.01,1.8965631484985352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,2,power_law_1.2,1.9704511642456055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,2,power_law_1.2,1.9778303146362304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,256,balanced,0.25249600410461426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,256,balanced,0.2530240019162496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,256,power_law_1.01,0.25691521167755127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,256,power_law_1.01,0.25779199600219727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,256,power_law_1.2,0.2673664093017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,256,power_law_1.2,0.2702719926834106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,32,balanced,0.3428959846496582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,32,balanced,0.3430826663970947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,32,power_law_1.01,0.35196800231933595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,32,power_law_1.01,0.355295991897583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,32,power_law_1.2,0.3645119905471802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,32,power_law_1.2,0.36833920478820803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,4,balanced,1.0709653695424397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,4,balanced,1.0786506334940593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,4,power_law_1.01,1.0323007583618165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,4,power_law_1.01,1.0552127838134766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,4,power_law_1.2,1.1092927932739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,4,power_law_1.2,1.1260736465454102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,64,balanced,0.2799999912579854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,64,balanced,0.281061331431071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,64,power_law_1.01,0.2985152006149292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,64,power_law_1.01,0.29967360496520995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,64,power_law_1.2,0.2974015951156616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,64,power_law_1.2,0.3158720016479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,8,balanced,0.6521439949671427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,8,balanced,0.6539093255996704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,8,power_law_1.01,0.6562111854553223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,8,power_law_1.01,0.6641407966613769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,8,power_law_1.2,0.6788864135742188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,1,8,power_law_1.2,0.6989183902740479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,16,1,balanced,0.4424320062001546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,16,1,balanced,0.4428906838099162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,16,1,power_law_1.01,0.43537278175354005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,16,1,power_law_1.01,0.43639039993286133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,16,1,power_law_1.2,0.44559359550476074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,16,1,power_law_1.2,0.447705602645874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,2,1,balanced,1.8698879877726238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,2,1,balanced,1.9530986150105794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,2,1,power_law_1.01,1.7986751556396485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,2,1,power_law_1.01,1.8272703170776368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,2,1,power_law_1.2,1.919468879699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,2,1,power_law_1.2,1.9230655670166015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,32,1,balanced,0.3427199920018514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,32,1,balanced,0.3447786569595337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,32,1,power_law_1.01,0.33943679332733157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,32,1,power_law_1.01,0.34558720588684083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,32,1,power_law_1.2,0.34702720642089846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,32,1,power_law_1.2,0.3532991886138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,4,1,balanced,1.0268373489379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,4,1,balanced,1.0346026420593262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,4,1,power_law_1.01,0.9990976333618165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,4,1,power_law_1.01,1.0344639778137208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,4,1,power_law_1.2,1.056396770477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,4,1,power_law_1.2,1.0642623901367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,8,1,balanced,0.6470986604690552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,8,1,balanced,0.6478240092595419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,8,1,power_law_1.01,0.6342463970184327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,8,1,power_law_1.01,0.6352704048156739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,8,1,power_law_1.2,0.6518847942352295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2048,8,256,8,1,power_law_1.2,0.6545472145080566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,1,balanced,2.8698132832845054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,1,balanced,2.8784427642822266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,1,power_law_1.01,3.214662551879883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,1,power_law_1.01,3.3062206268310548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,1,power_law_1.2,3.345062255859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,1,power_law_1.2,3.3453441619873048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,16,balanced,0.37720000743865967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,16,balanced,0.3794506788253784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,16,power_law_1.01,0.4290112018585205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,16,power_law_1.01,0.4390592098236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,16,power_law_1.2,0.44185600280761717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,16,power_law_1.2,0.4586495876312256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,2,balanced,1.5347466468811035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,2,balanced,1.5713760058085124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,2,power_law_1.01,1.6458623886108399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,2,power_law_1.01,1.6686399459838868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,2,power_law_1.2,1.7177984237670898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,2,power_law_1.2,1.7750080108642579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,32,balanced,0.2912213404973348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,32,balanced,0.29152532418568927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,32,power_law_1.01,0.33131520748138427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,32,power_law_1.01,0.3329472064971924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,32,power_law_1.2,0.34012160301208494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,32,power_law_1.2,0.35204479694366453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,4,balanced,0.8671573003133138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,4,balanced,0.8675200144449869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,4,power_law_1.01,0.9191231727600098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,4,power_law_1.01,0.9893247604370117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,4,power_law_1.2,0.9966655731201172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,4,power_law_1.2,1.0029312133789063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,8,balanced,0.5397173166275024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,8,balanced,0.5414559841156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,8,power_law_1.01,0.6035200119018554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,8,power_law_1.01,0.6036736011505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,8,power_law_1.2,0.6252416133880615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,1,8,power_law_1.2,0.6425663948059082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,16,1,balanced,0.367631991704305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,16,1,balanced,0.3692266543706258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,16,1,power_law_1.01,0.37920639514923093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,16,1,power_law_1.01,0.3824512004852295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,16,1,power_law_1.2,0.38819839954376223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,16,1,power_law_1.2,0.3930432081222534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,2,1,balanced,1.498586654663086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,2,1,balanced,1.5674559275309246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,2,1,power_law_1.01,1.5857279777526856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,2,1,power_law_1.01,1.6199552536010742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,2,1,power_law_1.2,1.622879981994629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,2,1,power_law_1.2,1.6534463882446289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,32,1,balanced,0.32945066690444946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,32,1,balanced,0.33027199904123944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,32,1,power_law_1.01,0.3438976049423218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,32,1,power_law_1.01,0.34415359497070314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,32,1,power_law_1.2,0.35043199062347413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,32,1,power_law_1.2,0.35140480995178225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,4,1,balanced,0.8415573438008627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,4,1,balanced,0.8433919747670492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,4,1,power_law_1.01,0.9027775764465332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,4,1,power_law_1.01,0.9056639671325684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,4,1,power_law_1.2,0.9130751609802246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,4,1,power_law_1.2,0.9151359558105469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,8,1,balanced,0.5015253225962321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,8,1,balanced,0.5030879974365234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,8,1,power_law_1.01,0.5619904041290283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,8,1,power_law_1.01,0.5657472133636474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,8,1,power_law_1.2,0.5702784061431885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,6144,2560,8,160,8,1,power_law_1.2,0.5729919910430908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,1,balanced,4.280991872151692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,1,balanced,4.372912089029948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,1,power_law_1.01,4.142534255981445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,1,power_law_1.01,4.217292785644531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,1,power_law_1.2,4.372959899902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,1,power_law_1.2,4.458777618408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,128,balanced,0.28775999943415326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,128,balanced,0.28969067335128784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,128,power_law_1.01,0.3025791883468628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,128,power_law_1.01,0.3044543981552124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,128,power_law_1.2,0.30462079048156737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,128,power_law_1.2,0.3137727975845337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,16,balanced,0.5042879978815714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,16,balanced,0.5050773223241171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,16,power_law_1.01,0.5098495960235596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,16,power_law_1.01,0.5216639995574951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,16,power_law_1.2,0.5361343860626221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,16,power_law_1.2,0.5525119781494141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,2,balanced,2.2873172760009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,2,balanced,2.347248077392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,2,power_law_1.01,2.2014144897460937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,2,power_law_1.01,2.2075712203979494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,2,power_law_1.2,2.2205503463745115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,2,power_law_1.2,2.2880319595336913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,256,balanced,0.28380799293518066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,256,balanced,0.28481600681940716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,256,power_law_1.01,0.2823744058609009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,256,power_law_1.01,0.2832832098007202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,256,power_law_1.2,0.2934720039367676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,256,power_law_1.2,0.2968127965927124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,32,balanced,0.3811733325322469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,32,balanced,0.3815946578979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,32,power_law_1.01,0.392409610748291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,32,power_law_1.01,0.40186238288879395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,32,power_law_1.2,0.4104767799377441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,32,power_law_1.2,0.41605119705200194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,4,balanced,1.2378986676534016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,4,balanced,1.2385653654734294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,4,power_law_1.01,1.2301183700561524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,4,power_law_1.01,1.233638381958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,4,power_law_1.2,1.2504575729370118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,4,power_law_1.2,1.2669119834899902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,64,balanced,0.311898668607076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,64,balanced,0.3121440013249715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,64,power_law_1.01,0.3280064105987549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,64,power_law_1.01,0.33308160305023193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,64,power_law_1.2,0.3388351917266846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,64,power_law_1.2,0.34640638828277587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,8,balanced,0.7452853520711263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,8,balanced,0.7465866406758627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,8,power_law_1.01,0.7384511947631835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,8,power_law_1.01,0.7424895763397217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,8,power_law_1.2,0.7756224155426026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,1,8,power_law_1.2,0.796563196182251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,16,1,balanced,0.5092639923095703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,16,1,balanced,0.5108426809310913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,16,1,power_law_1.01,0.5040575981140136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,16,1,power_law_1.01,0.506112003326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,16,1,power_law_1.2,0.5178944110870362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,16,1,power_law_1.2,0.5184895992279053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,2,1,balanced,2.2626293500264487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,2,1,balanced,2.317274729410807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,2,1,power_law_1.01,2.1473663330078123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,2,1,power_law_1.01,2.1661823272705076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,2,1,power_law_1.2,2.2271488189697264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,2,1,power_law_1.2,2.3451200485229493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,32,1,balanced,0.3924853404362996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,32,1,balanced,0.39371200402577716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,32,1,power_law_1.01,0.39032959938049316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,32,1,power_law_1.01,0.39472639560699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,32,1,power_law_1.2,0.4009984016418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,32,1,power_law_1.2,0.40208001136779786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,4,1,balanced,1.1929972966512044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,4,1,balanced,1.219493309656779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,4,1,power_law_1.01,1.1525952339172363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,4,1,power_law_1.01,1.1714752197265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,4,1,power_law_1.2,1.2378687858581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,4,1,power_law_1.2,1.2468992233276368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,8,1,balanced,0.7502613067626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,8,1,balanced,0.750607967376709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,8,1,power_law_1.01,0.7348671913146972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,8,1,power_law_1.01,0.7378240108489991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,8,1,power_law_1.2,0.753439998626709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,256,8,1,power_law_1.2,0.7576896190643311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,1,balanced,6.593109130859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,1,balanced,6.600976308186849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,1,power_law_1.01,5.643257522583008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,1,power_law_1.01,5.83507194519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,1,power_law_1.2,6.01025276184082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,1,power_law_1.2,6.089900970458984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,128,balanced,0.3561813433965047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,128,balanced,0.3567626476287842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,128,power_law_1.01,0.35970559120178225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,128,power_law_1.01,0.36662399768829346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,128,power_law_1.2,0.37189760208129885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,128,power_law_1.2,0.3769216060638428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,16,balanced,0.6778666973114014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,16,balanced,0.6782560348510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,16,power_law_1.01,0.6405375957489013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,16,power_law_1.01,0.666483211517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,16,power_law_1.2,0.6671360015869141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,16,power_law_1.2,0.6758399963378906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,2,balanced,3.408538818359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,2,balanced,3.5228214263916016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,2,power_law_1.01,2.831449508666992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,2,power_law_1.01,2.91973762512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,2,power_law_1.2,2.9384063720703124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,2,power_law_1.2,2.982067108154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,32,balanced,0.5028320153554281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,32,balanced,0.5031199852625529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,32,power_law_1.01,0.4978047847747803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,32,power_law_1.01,0.5083775997161866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,32,power_law_1.2,0.5060351848602295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,32,power_law_1.2,0.5064511775970459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,4,balanced,1.76801602045695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,4,balanced,1.769397258758545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,4,power_law_1.01,1.596390438079834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,4,power_law_1.01,1.6385343551635743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,4,power_law_1.2,1.6805248260498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,4,power_law_1.2,1.6917312622070313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,64,balanced,0.4015466769536336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,64,balanced,0.40174400806427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,64,power_law_1.01,0.3996351957321167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,64,power_law_1.01,0.4024320125579834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,64,power_law_1.2,0.4173567771911621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,64,power_law_1.2,0.4264959812164307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,8,balanced,1.051199992497762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,8,balanced,1.0515413284301758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,8,power_law_1.01,0.9249279975891114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,8,power_law_1.01,0.9477567672729492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,8,power_law_1.2,1.0113856315612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,1,8,power_law_1.2,1.0240127563476562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,16,1,balanced,0.7199093500773112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,16,1,balanced,0.7202826340993246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,16,1,power_law_1.01,0.6756927967071533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,16,1,power_law_1.01,0.6798143863677979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,16,1,power_law_1.2,0.6843008041381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,16,1,power_law_1.2,0.6867584228515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,2,1,balanced,3.3549814224243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,2,1,balanced,3.369413375854492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,2,1,power_law_1.01,2.823993682861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,2,1,power_law_1.01,2.865772819519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,2,1,power_law_1.2,2.9863616943359377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,2,1,power_law_1.2,3.0283647537231446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,32,1,balanced,0.5750346581141154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,32,1,balanced,0.5757546822230021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,32,1,power_law_1.01,0.5419072151184082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,32,1,power_law_1.01,0.5490240097045899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,32,1,power_law_1.2,0.5510335922241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,32,1,power_law_1.2,0.5512639999389648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,4,1,balanced,1.7871947288513184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,4,1,balanced,1.836400032043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,4,1,power_law_1.01,1.581331157684326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,4,1,power_law_1.01,1.5998784065246583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,4,1,power_law_1.2,1.6062911987304687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,4,1,power_law_1.2,1.623744010925293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,8,1,balanced,1.0822559992472331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,8,1,balanced,1.0838186740875244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,8,1,power_law_1.01,0.9557567596435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,8,1,power_law_1.01,0.9626751899719238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,8,1,power_law_1.2,0.9708800315856934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1024,7168,2048,8,384,8,1,power_law_1.2,0.986348819732666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,1,balanced,1.2617013454437256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,1,balanced,1.2622079849243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,1,power_law_1.01,1.4180288314819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,1,power_law_1.01,1.4281408309936523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,1,power_law_1.2,1.4374719619750977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,1,power_law_1.2,1.4401472091674805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,128,balanced,0.5888426701227824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,128,balanced,0.5892320076624552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,128,power_law_1.01,0.6467008113861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,128,power_law_1.01,0.647603178024292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,128,power_law_1.2,0.6957183837890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,128,power_law_1.2,0.6978496074676513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,16,balanced,0.6461120049158732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,16,balanced,0.6463413238525391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,16,power_law_1.01,0.7127295970916748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,16,power_law_1.01,0.7238336086273194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,16,power_law_1.2,0.7392384052276612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,16,power_law_1.2,0.7739071846008301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,2,balanced,1.080730676651001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,2,balanced,1.083082675933838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,2,power_law_1.01,1.1744000434875488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,2,power_law_1.01,1.1767616271972656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,2,power_law_1.2,1.2297280311584473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,2,power_law_1.2,1.2726207733154298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,32,balanced,0.6127200126647949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,32,balanced,0.6153759956359863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,32,power_law_1.01,0.683187198638916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,32,power_law_1.01,0.6876992225646973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,32,power_law_1.2,0.7215167999267578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,32,power_law_1.2,0.7389567852020263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,4,balanced,0.8307519753774008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,4,balanced,0.8325760364532471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,4,power_law_1.01,0.9127743721008301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,4,power_law_1.01,0.9466943740844727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,4,power_law_1.2,0.9836159706115722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,4,power_law_1.2,1.0166336059570313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,64,balanced,0.5958986679712931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,64,balanced,0.5962186654408773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,64,power_law_1.01,0.6638783931732177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,64,power_law_1.01,0.6696512222290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,64,power_law_1.2,0.6987264156341553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,64,power_law_1.2,0.7090432167053222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,8,balanced,0.7086506684621176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,8,balanced,0.7090986569722494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,8,power_law_1.01,0.8035391807556153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,8,power_law_1.01,0.8101887702941895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,8,power_law_1.2,0.8040191650390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,1,8,power_law_1.2,0.8392704010009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,2,1,balanced,0.9521653652191162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,2,1,balanced,0.9561973412831625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,2,1,power_law_1.01,1.0178048133850097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,2,1,power_law_1.01,1.019987201690674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,2,1,power_law_1.2,1.0265472412109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,2,1,power_law_1.2,1.0281984329223632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,4,1,balanced,0.7129173278808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,4,1,balanced,0.7161920070648193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,4,1,power_law_1.01,0.7492608070373535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,4,1,power_law_1.01,0.7500864028930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,4,1,power_law_1.2,0.7571072101593017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2048,768,8,128,4,1,power_law_1.2,0.7604159832000732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,1,balanced,3.1151679356892905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,1,balanced,3.1522773106892905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,1,power_law_1.01,3.0364864349365233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,1,power_law_1.01,3.096940803527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,1,power_law_1.2,3.0789119720458986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,1,power_law_1.2,3.1134016036987306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,128,balanced,0.7703466415405273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,128,balanced,0.7707146803538004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,128,power_law_1.01,0.9045760154724121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,128,power_law_1.01,0.9115391731262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,128,power_law_1.2,1.0240960121154785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,128,power_law_1.2,1.0509568214416505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,16,balanced,0.9052639802296957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,16,balanced,0.9053760369618734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,16,power_law_1.01,1.0647104263305665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,16,power_law_1.01,1.073798370361328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,16,power_law_1.2,1.1662528038024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,16,power_law_1.2,1.1889023780822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,2,balanced,1.994655927022298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,2,balanced,2.0109386444091797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,2,power_law_1.01,2.1486591339111327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,2,power_law_1.01,2.1499008178710937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,2,power_law_1.2,2.3695999145507813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,2,power_law_1.2,2.4106752395629885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,32,balanced,0.8272799650828043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,32,balanced,0.8284800052642822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,32,power_law_1.01,0.9843839645385742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,32,power_law_1.01,0.9942208290100097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,32,power_law_1.2,1.0656384468078612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,32,power_law_1.2,1.1262144088745116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,4,balanced,1.3754560152689617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,4,balanced,1.3763680458068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,4,power_law_1.01,1.5629440307617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,4,power_law_1.01,1.6064191818237306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,4,power_law_1.2,1.6761215209960938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,4,power_law_1.2,1.7372671127319337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,64,balanced,0.7882186571756998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,64,balanced,0.7885653177897135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,64,power_law_1.01,0.9175488471984863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,64,power_law_1.01,0.9370368003845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,64,power_law_1.2,1.0293248176574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,64,power_law_1.2,1.0468159675598145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,8,balanced,1.061247984568278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,8,balanced,1.0618560314178467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,8,power_law_1.01,1.2543231964111328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,8,power_law_1.01,1.2675007820129394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,8,power_law_1.2,1.3054271697998048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,1,8,power_law_1.2,1.373305606842041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,16,1,balanced,1.410762627919515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,16,1,balanced,1.4119466145833333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,16,1,power_law_1.01,1.4492032051086425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,16,1,power_law_1.01,1.4509504318237305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,16,1,power_law_1.2,1.4644927978515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,16,1,power_law_1.2,1.469337558746338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,2,1,balanced,1.8809973398844402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,2,1,balanced,1.9271039962768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,2,1,power_law_1.01,1.87969913482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,2,1,power_law_1.01,1.8879360198974608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,2,1,power_law_1.2,1.898796844482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,2,1,power_law_1.2,1.9101119995117188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,32,1,balanced,1.170570691426595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,32,1,balanced,1.1710879802703857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,32,1,power_law_1.01,1.2043519973754884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,32,1,power_law_1.01,1.2048000335693358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,32,1,power_law_1.2,1.2161151885986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,32,1,power_law_1.2,1.2172351837158204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,4,1,balanced,1.2012800375620525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,4,1,balanced,1.2048693497975667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,4,1,power_law_1.01,1.2272576332092284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,4,1,power_law_1.01,1.238259220123291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,4,1,power_law_1.2,1.2442879676818848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,4,1,power_law_1.2,1.2465279579162598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,8,1,balanced,1.7797226905822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,8,1,balanced,1.7815732955932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,8,1,power_law_1.01,1.818387222290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,8,1,power_law_1.01,1.825721549987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,8,1,power_law_1.2,1.8395647048950194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,2688,1856,6,128,8,1,power_law_1.2,1.8422592163085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,1,balanced,4.1359148025512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,1,balanced,4.37665589650472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,1,power_law_1.01,4.619929504394531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,1,power_law_1.01,4.636371231079101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,1,power_law_1.2,4.623328018188476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,1,power_law_1.2,4.7954753875732425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,128,balanced,0.9138240019480387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,128,balanced,0.9168586730957031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,128,power_law_1.01,1.0105600357055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,128,power_law_1.01,1.0242112159729004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,128,power_law_1.2,1.0842304229736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,128,power_law_1.2,1.1079039573669434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,16,balanced,1.0887893040974934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,16,balanced,1.0899466673533122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,16,power_law_1.01,1.2609984397888183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,16,power_law_1.01,1.2715392112731934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,16,power_law_1.2,1.3144191741943358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,16,power_law_1.2,1.3754176139831542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,2,balanced,2.559706687927246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,2,balanced,2.5882879892985025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,2,power_law_1.01,2.7940095901489257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,2,power_law_1.01,2.825721549987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,2,power_law_1.2,2.880710411071777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,2,power_law_1.2,2.99224967956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,256,balanced,0.9030133088429769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,256,balanced,0.9046773115793864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,256,power_law_1.01,0.9841343879699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,256,power_law_1.01,0.9875200271606446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,256,power_law_1.2,1.105951976776123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,256,power_law_1.2,1.1061951637268066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,32,balanced,0.9918453693389893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,32,balanced,0.9946239789326986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,32,power_law_1.01,1.1171968460083008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,32,power_law_1.01,1.147270393371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,32,power_law_1.2,1.21212797164917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,32,power_law_1.2,1.237504005432129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,4,balanced,1.6862880388895671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,4,balanced,1.6945600509643555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,4,power_law_1.01,1.9701503753662108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,4,power_law_1.01,2.010867118835449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,4,power_law_1.2,1.9869056701660157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,4,power_law_1.2,2.0395904541015626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,64,balanced,0.9396373430887858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,64,balanced,0.9397706985473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,64,power_law_1.01,1.0607040405273438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,64,power_law_1.01,1.0685952186584473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,64,power_law_1.2,1.1429887771606446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,64,power_law_1.2,1.1780799865722655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,8,balanced,1.2861333688100178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,8,balanced,1.2894666989644368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,8,power_law_1.01,1.509836769104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,8,power_law_1.01,1.5264191627502441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,8,power_law_1.2,1.555123233795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,1,8,power_law_1.2,1.5815679550170898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,16,1,balanced,0.9006720383961996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,16,1,balanced,0.9030933380126953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,16,1,power_law_1.01,0.975551986694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,16,1,power_law_1.01,0.9777600288391113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,16,1,power_law_1.2,0.9842944145202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,16,1,power_law_1.2,0.9884480476379395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,2,1,balanced,2.398357391357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,2,1,balanced,2.3985279401143393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,2,1,power_law_1.01,2.5243967056274412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,2,1,power_law_1.01,2.5744384765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,2,1,power_law_1.2,2.5887168884277343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,2,1,power_law_1.2,2.5947328567504884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,32,1,balanced,0.7638773123423258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,32,1,balanced,0.7646453380584717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,32,1,power_law_1.01,0.8323200225830079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,32,1,power_law_1.01,0.8336000442504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,32,1,power_law_1.2,0.842899227142334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,32,1,power_law_1.2,0.8442048072814942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,4,1,balanced,1.4311572710673015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,4,1,balanced,1.4340747197469075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,4,1,power_law_1.01,1.5722880363464355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,4,1,power_law_1.01,1.5726719856262208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,4,1,power_law_1.2,1.6016960144042969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,4,1,power_law_1.2,1.6034879684448242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,8,1,balanced,1.049397309621175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,8,1,balanced,1.049829324086507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,8,1,power_law_1.01,1.1379776000976562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,8,1,power_law_1.01,1.1384703636169433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,8,1,power_law_1.2,1.1506752014160155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,3072,1536,8,256,8,1,power_law_1.2,1.150937557220459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,1,balanced,11.260453542073568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,1,balanced,11.297322591145834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,1,power_law_1.01,11.000511932373048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,1,power_law_1.01,11.206265258789063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,1,power_law_1.2,11.158879852294922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,1,power_law_1.2,11.263231658935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,2,balanced,5.991525650024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,2,balanced,6.1189225514729815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,2,power_law_1.01,7.7620094299316404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,2,power_law_1.01,8.284710693359376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,2,power_law_1.2,8.196089935302734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,2,power_law_1.2,8.805158233642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,4,balanced,3.480981190999349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,4,balanced,3.513893445332845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,4,power_law_1.01,6.122975921630859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,4,power_law_1.01,7.372831726074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,4,power_law_1.2,6.062355041503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,4,power_law_1.2,6.623391723632812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,8,balanced,2.311583995819092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,8,balanced,2.3172480265299478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,8,power_law_1.01,5.0574592590332035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,8,power_law_1.01,5.109875106811524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,8,power_law_1.2,5.746342468261719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,1,8,power_law_1.2,6.038956832885742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,16,1,balanced,0.7543040116628011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,16,1,balanced,0.7544000148773193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,16,1,power_law_1.01,0.7706048011779785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,16,1,power_law_1.01,0.7862847805023193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,16,1,power_law_1.2,0.7757503986358643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,16,1,power_law_1.2,0.7796351909637451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,2,1,balanced,4.943589210510254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,2,1,balanced,5.081247965494792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,2,1,power_law_1.01,4.790182495117188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,2,1,power_law_1.01,5.032524871826172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,2,1,power_law_1.2,4.836851119995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,2,1,power_law_1.2,4.900179290771485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,32,1,balanced,0.500485340754191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,32,1,balanced,0.5022986729939779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,32,1,power_law_1.01,0.5110015869140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,32,1,power_law_1.01,0.511411190032959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,32,1,power_law_1.2,0.51112961769104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,32,1,power_law_1.2,0.5130815982818604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,4,1,balanced,2.374015967051188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,4,1,balanced,2.541370709737142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,4,1,power_law_1.01,2.460767936706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,4,1,power_law_1.01,2.468351936340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,4,1,power_law_1.2,2.452217674255371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,4,1,power_law_1.2,2.4818752288818358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,8,1,balanced,1.306069294611613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,8,1,balanced,1.308245340983073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,8,1,power_law_1.01,1.300166416168213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,8,1,power_law_1.01,1.3295488357543945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,8,1,power_law_1.2,1.324441623687744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,14336,2,8,8,1,power_law_1.2,1.3262335777282714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,1,balanced,4.882389386494954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,1,balanced,4.900597254435222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,1,power_law_1.01,5.078630447387695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,1,power_law_1.01,5.283379364013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,1,power_law_1.2,4.944793701171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,1,power_law_1.2,4.9900672912597654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,128,balanced,1.030191977818807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,128,balanced,1.0305759906768799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,128,power_law_1.01,1.222719955444336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,128,power_law_1.01,1.233011245727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,128,power_law_1.2,1.4224127769470214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,128,power_law_1.2,1.423040008544922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,16,balanced,1.2372852961222331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,16,balanced,1.2394346396128337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,16,power_law_1.01,1.5318016052246093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,16,power_law_1.01,1.547436809539795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,16,power_law_1.2,1.677689552307129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,16,power_law_1.2,1.7867904663085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,2,balanced,2.9691893259684243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,2,balanced,3.080538749694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,2,power_law_1.01,3.2381824493408202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,2,power_law_1.01,3.329792022705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,2,power_law_1.2,3.5583934783935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,2,power_law_1.2,3.5855297088623046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,32,balanced,1.119157314300537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,32,balanced,1.1237226327260335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,32,power_law_1.01,1.3744640350341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,32,power_law_1.01,1.395257568359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,32,power_law_1.2,1.497760009765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,32,power_law_1.2,1.5723199844360352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,4,balanced,1.957738717397054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,4,balanced,1.9634025891621907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,4,power_law_1.01,2.420217514038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,4,power_law_1.01,2.511756706237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,4,power_law_1.2,2.3103616714477537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,4,power_law_1.2,2.3550848007202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,64,balanced,1.0620319843292236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,64,balanced,1.0639999707539876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,64,power_law_1.01,1.2846528053283692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,64,power_law_1.01,1.3149503707885741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,64,power_law_1.2,1.4901439666748046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,64,power_law_1.2,1.534278392791748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,8,balanced,1.4767519632975261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,8,balanced,1.4769387245178223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,8,power_law_1.01,1.8694528579711913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,8,power_law_1.01,1.8949567794799804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,8,power_law_1.2,1.9277055740356446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,1,8,power_law_1.2,1.984217643737793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,16,1,balanced,1.1065653165181477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,16,1,balanced,1.1110453605651855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,16,1,power_law_1.01,1.1646656036376952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,16,1,power_law_1.01,1.1652607917785645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,16,1,power_law_1.2,1.1681856155395507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,16,1,power_law_1.2,1.173305606842041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,2,1,balanced,2.268965403238932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,2,1,balanced,2.3243199984232583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,2,1,power_law_1.01,2.5203327178955077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,2,1,power_law_1.01,2.6007551193237304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,2,1,power_law_1.2,2.5505088806152343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,2,1,power_law_1.2,2.5548736572265627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,32,1,balanced,0.9421760241190592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,32,1,balanced,0.9433493614196777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,32,1,power_law_1.01,0.987007999420166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,32,1,power_law_1.01,0.9911231994628906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,32,1,power_law_1.2,0.9954560279846192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,32,1,power_law_1.2,0.9989952087402344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,4,1,balanced,1.7328640619913738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,4,1,balanced,1.7363252639770508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,4,1,power_law_1.01,1.8379327774047851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,4,1,power_law_1.01,1.8438655853271484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,4,1,power_law_1.2,1.8572479248046876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,4,1,power_law_1.2,1.8661632537841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,8,1,balanced,1.2769493261973064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,8,1,balanced,1.2829066912333171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,8,1,power_law_1.01,1.3488320350646972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,8,1,power_law_1.01,1.3501312255859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,8,1,power_law_1.2,1.3577919960021974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,1536,8,128,8,1,power_law_1.2,1.3584256172180176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,1,balanced,29.936752319335938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,1,balanced,30.670570373535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,1,power_law_1.01,27.43018798828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,1,power_law_1.01,27.571444702148437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,1,power_law_1.2,27.373223876953126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,1,power_law_1.2,27.878701782226564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,128,balanced,3.7742347717285156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,128,balanced,3.779904047648112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,128,power_law_1.01,4.174483108520508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,128,power_law_1.01,4.203564834594727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,128,power_law_1.2,4.545945739746093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,128,power_law_1.2,4.60492172241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,16,balanced,5.033839861551921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,16,balanced,5.04476801554362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,16,power_law_1.01,5.466432189941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,16,power_law_1.01,5.699033737182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,16,power_law_1.2,5.812038421630859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,16,power_law_1.2,5.873638534545899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,2,balanced,16.68509292602539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,2,balanced,17.021743774414062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,2,power_law_1.01,16.309939575195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,2,power_law_1.01,16.773414611816406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,2,power_law_1.2,16.422335815429687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,2,power_law_1.2,17.04589385986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,256,balanced,3.6804478963216147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,256,balanced,3.687408129374186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,256,power_law_1.01,4.047686386108398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,256,power_law_1.01,4.059827041625977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,256,power_law_1.2,4.404550552368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,256,power_law_1.2,4.439807891845703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,32,balanced,4.308789253234863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,32,balanced,4.31275208791097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,32,power_law_1.01,4.883212661743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,32,power_law_1.01,4.8874046325683596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,32,power_law_1.2,5.251603317260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,32,power_law_1.2,5.338630294799804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,4,balanced,10.320469538370768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,4,balanced,9.878047943115234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,4,power_law_1.01,10.031327819824218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,4,power_law_1.01,10.746937561035157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,4,power_law_1.2,10.284006500244141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,4,power_law_1.2,10.622176361083984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,64,balanced,3.9538294474283853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,64,balanced,3.955205281575521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,64,power_law_1.01,4.403123092651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,64,power_law_1.01,4.45904655456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,64,power_law_1.2,4.727967834472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,64,power_law_1.2,4.7904510498046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,8,balanced,6.505231857299805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,8,balanced,6.51038932800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,8,power_law_1.01,6.813926696777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,8,power_law_1.01,7.107462310791016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,8,power_law_1.2,7.0425666809082035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,1,8,power_law_1.2,7.6267646789550785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,16,1,balanced,8.674869537353516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,16,1,balanced,8.680730819702148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,16,1,power_law_1.01,8.216812896728516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,16,1,power_law_1.01,8.241497802734376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,16,1,power_law_1.2,8.312499237060546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,16,1,power_law_1.2,8.319840240478516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,2,1,balanced,13.490100860595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,2,1,balanced,14.001669565836588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,2,1,power_law_1.01,13.43969268798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,2,1,power_law_1.01,13.487596130371093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,2,1,power_law_1.2,13.29516143798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,2,1,power_law_1.2,13.43719024658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,32,1,balanced,7.556970596313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,32,1,balanced,7.574064254760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,32,1,power_law_1.01,7.209817504882812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,32,1,power_law_1.01,7.2269950866699215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,32,1,power_law_1.2,7.317836761474609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,32,1,power_law_1.2,7.3265533447265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,4,1,balanced,25.04376475016276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,4,1,balanced,25.096923828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,4,1,power_law_1.01,25.263136291503905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,4,1,power_law_1.01,25.392819213867188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,4,1,power_law_1.2,24.739891052246094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,4,1,power_law_1.2,25.266636657714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,8,1,balanced,5.517663955688477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,8,1,balanced,5.720981597900391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,8,1,power_law_1.01,5.3511615753173825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,8,1,power_law_1.01,5.384569549560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,8,1,power_law_1.2,5.24793586730957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,4096,2688,22,512,8,1,power_law_1.2,5.410374450683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,1,balanced,18.96324284871419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,1,balanced,19.006368001302082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,1,power_law_1.01,18.30547180175781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,1,power_law_1.01,18.49462432861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,1,power_law_1.2,18.456370544433593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,1,power_law_1.2,19.19111022949219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,2,balanced,10.378688176472982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,2,balanced,9.533952077229818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,2,power_law_1.01,11.661830139160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,2,power_law_1.01,12.729170989990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,2,power_law_1.2,13.001695251464843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,2,power_law_1.2,13.945458984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,4,balanced,5.469472249348958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,4,balanced,5.511434555053711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,4,power_law_1.01,12.16776351928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,4,power_law_1.01,12.281267547607422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,4,power_law_1.2,10.425702667236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,4,power_law_1.2,11.503059387207031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,8,balanced,3.245706558227539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,8,balanced,3.2913173039754233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,8,power_law_1.01,9.066355133056641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,8,power_law_1.01,9.148576354980468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,8,power_law_1.2,9.478585815429687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,1,8,power_law_1.2,9.538028717041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,16,1,balanced,1.2210293610890706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,16,1,balanced,1.2244640191396077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,16,1,power_law_1.01,1.2423232078552247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,16,1,power_law_1.01,1.2464256286621094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,16,1,power_law_1.2,1.2281855583190917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,16,1,power_law_1.2,1.243609619140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,2,1,balanced,8.95132827758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,2,1,balanced,8.968202590942383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,2,1,power_law_1.01,8.625465393066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,2,1,power_law_1.01,8.834425354003907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,2,1,power_law_1.2,8.628102111816407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,2,1,power_law_1.2,8.715615844726562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,32,1,balanced,0.7881866296132406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,32,1,balanced,0.7913920084635416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,32,1,power_law_1.01,0.7971839904785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,32,1,power_law_1.01,0.7985856056213378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,32,1,power_law_1.2,0.8001215934753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,32,1,power_law_1.2,0.8021504402160644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,4,1,balanced,4.212458610534668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,4,1,balanced,4.227429389953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,4,1,power_law_1.01,4.112748718261718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,4,1,power_law_1.01,4.196441650390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,4,1,power_law_1.2,4.056979370117188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,4,1,power_law_1.2,4.182009506225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,8,1,balanced,2.1376266479492188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,8,1,balanced,2.168346722920736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,8,1,power_law_1.01,2.1557695388793947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,8,1,power_law_1.01,2.173209571838379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,8,1,power_law_1.2,2.1554880142211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,16384,2,8,8,1,power_law_1.2,2.166092872619629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,1,balanced,10.708277384440104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,1,balanced,10.903925577799479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,1,power_law_1.01,11.986975860595702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,1,power_law_1.01,12.260851287841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,1,power_law_1.2,12.21564178466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,1,power_law_1.2,12.357561492919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,128,balanced,1.5107626914978027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,128,balanced,1.5143680572509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,128,power_law_1.01,1.7408639907836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,128,power_law_1.01,1.8520191192626954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,128,power_law_1.2,2.058278465270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,128,power_law_1.2,2.0788032531738283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,16,balanced,1.954319953918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,16,balanced,1.9645813306172688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,16,power_law_1.01,2.3848831176757814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,16,power_law_1.01,2.468262481689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,16,power_law_1.2,2.6573503494262694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,16,power_law_1.2,2.726598358154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,2,balanced,6.132421493530273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,2,balanced,6.155637105305989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,2,power_law_1.01,6.947763061523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,2,power_law_1.01,7.1531837463378904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,2,power_law_1.2,6.871647644042969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,2,power_law_1.2,6.980319976806641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,256,balanced,1.4831466674804688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,256,balanced,1.4893120129903157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,256,power_law_1.01,1.6961536407470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,256,power_law_1.01,1.7185792922973633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,256,power_law_1.2,1.9261568069458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,256,power_law_1.2,1.9700416564941405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,32,balanced,1.6959253946940105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,32,balanced,1.6961493492126465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,32,power_law_1.01,2.116428756713867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,32,power_law_1.01,2.193440055847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,32,power_law_1.2,2.2578432083129885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,32,power_law_1.2,2.432620811462402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,4,balanced,3.591258684794108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,4,balanced,3.59281063079834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,4,power_law_1.01,4.243251037597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,4,power_law_1.01,4.4166912078857425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,4,power_law_1.2,4.390092849731445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,4,power_law_1.2,4.736153411865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,64,balanced,1.5740052858988445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,64,balanced,1.5788000424702961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,64,power_law_1.01,1.8423551559448241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,64,power_law_1.01,1.862950325012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,64,power_law_1.2,2.126028823852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,64,power_law_1.2,2.201644706726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,8,balanced,2.492736021677653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,8,balanced,2.49290132522583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,8,power_law_1.01,3.012665557861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,8,power_law_1.01,3.098547172546387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,8,power_law_1.2,3.197830390930176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,1,8,power_law_1.2,3.2911617279052736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,16,1,balanced,1.671354611714681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,16,1,balanced,1.6716373761494954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,16,1,power_law_1.01,1.7903871536254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,16,1,power_law_1.01,1.7929471969604491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,16,1,power_law_1.2,1.80316162109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,16,1,power_law_1.2,1.8039295196533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,2,1,balanced,5.570021311442058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,2,1,balanced,5.652394612630208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,2,1,power_law_1.01,6.227155303955078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,2,1,power_law_1.01,6.295296096801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,2,1,power_law_1.2,6.1412353515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,2,1,power_law_1.2,6.3019775390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,32,1,balanced,1.3982399304707844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,32,1,balanced,1.4001493453979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,32,1,power_law_1.01,1.5155967712402343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,32,1,power_law_1.01,1.5178943634033204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,32,1,power_law_1.2,1.5313599586486817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,32,1,power_law_1.2,1.5381695747375488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,4,1,balanced,3.195898691813151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,4,1,balanced,3.2948427200317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,4,1,power_law_1.01,3.485977554321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,4,1,power_law_1.01,3.5290817260742187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,4,1,power_law_1.2,3.6001792907714845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,4,1,power_law_1.2,3.642630386352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,8,1,balanced,2.172741254170736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,8,1,balanced,2.176250616709391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,8,1,power_law_1.01,2.3419071197509767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,8,1,power_law_1.01,2.3464000701904295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,8,1,power_law_1.2,2.378022384643555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2048,8,256,8,1,power_law_1.2,2.379257583618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,1,balanced,12.890672047932943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,1,balanced,13.068645477294922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,1,power_law_1.01,13.46072998046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,1,power_law_1.01,13.69420166015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,1,power_law_1.2,13.583660888671876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,1,power_law_1.2,13.699948120117188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,16,balanced,2.1558879216512046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,16,balanced,2.1642932891845703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,16,power_law_1.01,2.8164480209350584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,16,power_law_1.01,2.8887935638427735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,16,power_law_1.2,3.2951934814453123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,16,power_law_1.2,3.3041408538818358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,2,balanced,6.9338029225667315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,2,balanced,7.672842661539714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,2,power_law_1.01,7.665280151367187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,2,power_law_1.01,8.16495361328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,2,power_law_1.2,8.143526458740235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,2,power_law_1.2,8.756774139404296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,32,balanced,1.8403786023457844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,32,balanced,1.8452852567036946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,32,power_law_1.01,2.3709951400756837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,32,power_law_1.01,2.4755136489868166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,32,power_law_1.2,2.824851226806641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,32,power_law_1.2,3.1396928787231446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,4,balanced,4.218981424967448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,4,balanced,4.272533416748047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,4,power_law_1.01,4.89153938293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,4,power_law_1.01,5.202323150634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,4,power_law_1.2,5.2215423583984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,4,power_law_1.2,5.286816024780274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,8,balanced,2.7957493464152017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,8,balanced,2.8100852966308594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,8,power_law_1.01,3.564108657836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,8,power_law_1.01,3.6039806365966798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,8,power_law_1.2,4.081862258911133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,1,8,power_law_1.2,4.239961624145508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,16,1,balanced,1.8791999816894531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,16,1,balanced,1.8809439341227214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,16,1,power_law_1.01,1.9403200149536133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,16,1,power_law_1.01,1.9466175079345702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,16,1,power_law_1.2,1.9618431091308595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,16,1,power_law_1.2,1.9771007537841796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,2,1,balanced,6.660624186197917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,2,1,balanced,6.840719858805339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,2,1,power_law_1.01,6.772013092041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,2,1,power_law_1.01,6.830790710449219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,2,1,power_law_1.2,6.818195343017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,2,1,power_law_1.2,7.008319854736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,32,1,balanced,1.6093759536743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,32,1,balanced,1.6109439531962078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,32,1,power_law_1.01,1.6694656372070313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,32,1,power_law_1.01,1.6714431762695312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,32,1,power_law_1.2,1.6973184585571288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,32,1,power_law_1.2,1.6986047744750976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,4,1,balanced,3.771168073018392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,4,1,balanced,3.82861328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,4,1,power_law_1.01,3.8866943359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,4,1,power_law_1.01,3.894073486328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,4,1,power_law_1.2,3.810822296142578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,4,1,power_law_1.2,3.936716842651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,8,1,balanced,2.3529760042826333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,8,1,balanced,2.4117280642191568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,8,1,power_law_1.01,2.462879943847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,8,1,power_law_1.01,2.47139835357666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,8,1,power_law_1.2,2.47325439453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,6144,2560,8,160,8,1,power_law_1.2,2.4838207244873045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,1,balanced,11.950239817301432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,1,balanced,12.49502944946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,1,power_law_1.01,13.952825927734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,1,power_law_1.01,14.38976593017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,1,power_law_1.2,14.173561096191406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,1,power_law_1.2,14.491162109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,128,balanced,1.6681599617004395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,128,balanced,1.671295960744222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,128,power_law_1.01,2.00134391784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,128,power_law_1.01,2.031372833251953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,128,power_law_1.2,2.1828927993774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,128,power_law_1.2,2.353875160217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,16,balanced,2.1912105878194175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,16,balanced,2.197493394215902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,16,power_law_1.01,2.681222343444824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,16,power_law_1.01,2.7705408096313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,16,power_law_1.2,3.0315391540527346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,16,power_law_1.2,3.0772031784057616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,2,balanced,6.984687805175781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,2,balanced,7.001029332478841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,2,power_law_1.01,8.134406280517577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,2,power_law_1.01,8.336505889892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,2,power_law_1.2,8.761996459960937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,2,power_law_1.2,8.846137237548827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,256,balanced,1.6339200337727864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,256,balanced,1.6442666053771973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,256,power_law_1.01,1.8681280136108398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,256,power_law_1.01,1.8948736190795898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,256,power_law_1.2,2.1665407180786134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,256,power_law_1.2,2.175001525878906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,32,balanced,1.8830347061157227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,32,balanced,1.8838720321655273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,32,power_law_1.01,2.3531455993652344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,32,power_law_1.01,2.4656448364257812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,32,power_law_1.2,2.603059196472168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,32,power_law_1.2,2.6649023056030274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,4,balanced,4.1637013753255205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,4,balanced,4.297648111979167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,4,power_law_1.01,5.155910491943359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,4,power_law_1.01,5.160326385498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,4,power_law_1.2,5.6028800964355465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,4,power_law_1.2,5.6825214385986325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,64,balanced,1.7396799723307292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,64,balanced,1.7479039827982585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,64,power_law_1.01,2.1375871658325196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,64,power_law_1.01,2.168012809753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,64,power_law_1.2,2.4510528564453127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,64,power_law_1.2,2.456991958618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,8,balanced,2.796874682108561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,8,balanced,2.8190078735351562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,8,power_law_1.01,3.528307342529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,8,power_law_1.01,3.6384639739990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,8,power_law_1.2,3.925913619995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,1,8,power_law_1.2,4.217049789428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,16,1,balanced,1.9165493647257488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,16,1,balanced,1.9232959747314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,16,1,power_law_1.01,2.0607295989990235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,16,1,power_law_1.01,2.060812759399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,16,1,power_law_1.2,2.082169532775879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,16,1,power_law_1.2,2.0905023574829102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,2,1,balanced,6.382106781005859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,2,1,balanced,6.482880274454753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,2,1,power_law_1.01,7.219257354736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,2,1,power_law_1.01,7.42608642578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,2,1,power_law_1.2,7.4159423828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,2,1,power_law_1.2,7.519731140136718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,32,1,balanced,1.6025813420613606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,32,1,balanced,1.6029386520385742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,32,1,power_law_1.01,1.7458112716674805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,32,1,power_law_1.01,1.7481279373168945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,32,1,power_law_1.2,1.7612800598144531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,32,1,power_law_1.2,1.7654016494750977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,4,1,balanced,3.730799992879232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,4,1,balanced,3.821706771850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,4,1,power_law_1.01,4.103680038452149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,4,1,power_law_1.01,4.113868713378906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,4,1,power_law_1.2,4.079545593261718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,4,1,power_law_1.2,4.237017440795898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,8,1,balanced,2.506997267405192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,8,1,balanced,2.5336532592773438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,8,1,power_law_1.01,2.7121088027954103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,8,1,power_law_1.01,2.7130559921264648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,8,1,power_law_1.2,2.7358272552490233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,256,8,1,power_law_1.2,2.753055953979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,1,balanced,13.264928181966146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,1,balanced,13.559487660725912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,1,power_law_1.01,15.701805114746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,1,power_law_1.01,15.711418151855469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,1,power_law_1.2,16.191673278808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,1,power_law_1.2,16.32030792236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,128,balanced,1.7321813901265461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,128,balanced,1.7349546750386555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,128,power_law_1.01,1.9942144393920898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,128,power_law_1.01,1.9948928833007813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,128,power_law_1.2,2.2180479049682615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,128,power_law_1.2,2.2722751617431642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,16,balanced,2.2853973706563315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,16,balanced,2.2934187253316245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,16,power_law_1.01,2.832102394104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,16,power_law_1.01,2.864851188659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,16,power_law_1.2,2.8786624908447265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,16,power_law_1.2,3.2024768829345702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,2,balanced,7.312933603922526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,2,balanced,7.46563720703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,2,power_law_1.01,8.717491149902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,2,power_law_1.01,8.90469741821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,2,power_law_1.2,9.26382064819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,2,power_law_1.2,9.569158172607422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,32,balanced,1.9595893224080403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,32,balanced,1.9679147402445476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,32,power_law_1.01,2.3397567749023436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,32,power_law_1.01,2.4276351928710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,32,power_law_1.2,2.55281925201416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,32,power_law_1.2,2.6416831970214845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,4,balanced,4.306362787882487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,4,balanced,4.38971741994222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,4,power_law_1.01,5.267891311645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,4,power_law_1.01,5.580748748779297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,4,power_law_1.2,5.654796981811524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,4,power_law_1.2,5.86864013671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,64,balanced,1.8066612879435222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,64,balanced,1.8097279866536458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,64,power_law_1.01,2.114348793029785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,64,power_law_1.01,2.117977523803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,64,power_law_1.2,2.2703039169311525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,64,power_law_1.2,2.335327911376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,8,balanced,2.9357385635375977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,8,balanced,2.956853230794271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,8,power_law_1.01,3.5945919036865233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,8,power_law_1.01,3.6745086669921876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,8,power_law_1.2,3.814227294921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,1,8,power_law_1.2,4.1123710632324215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,16,1,balanced,2.007317384084066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,16,1,balanced,2.0133066177368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,16,1,power_law_1.01,2.2079999923706053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,16,1,power_law_1.01,2.219539260864258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,16,1,power_law_1.2,2.2647104263305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,16,1,power_law_1.2,2.273907279968262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,2,1,balanced,7.070682525634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,2,1,balanced,7.099573135375977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,2,1,power_law_1.01,8.203488159179688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,2,1,power_law_1.01,8.4166015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,2,1,power_law_1.2,8.22052459716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,2,1,power_law_1.2,8.227263641357421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,32,1,balanced,1.6719679832458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,32,1,balanced,1.6730292638142903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,32,1,power_law_1.01,1.8505664825439454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,32,1,power_law_1.01,1.8557184219360352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,32,1,power_law_1.2,1.8764095306396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,32,1,power_law_1.2,1.8826879501342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,4,1,balanced,3.914815902709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,4,1,balanced,4.042661348978679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,4,1,power_law_1.01,4.584371185302734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,4,1,power_law_1.01,4.64136962890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,4,1,power_law_1.2,4.569798278808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,4,1,power_law_1.2,4.764601516723633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,8,1,balanced,2.6204427083333335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,8,1,balanced,2.633514722188314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,8,1,power_law_1.01,2.943846321105957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,8,1,power_law_1.01,2.9559999465942384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,8,1,power_law_1.2,3.0249151229858398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,12288,7168,2048,8,384,8,1,power_law_1.2,3.0361600875854493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,1,balanced,0.21140267451604208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,1,balanced,0.21213332811991373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,1,power_law_1.01,0.19930880069732665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,1,power_law_1.01,0.20173439979553223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,1,power_law_1.2,0.2081279993057251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,1,power_law_1.2,0.211027193069458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,128,balanced,0.04350399971008301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,128,balanced,0.04355733096599579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,128,power_law_1.01,0.041920000314712526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,128,power_law_1.01,0.042208001017570496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,128,power_law_1.2,0.041484799981117246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,128,power_law_1.2,0.04176000058650971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,16,balanced,0.05123200019200643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,16,balanced,0.05205333232879639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,16,power_law_1.01,0.047788798809051514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,16,power_law_1.01,0.05118079781532288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,16,power_law_1.2,0.04965760111808777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,16,power_law_1.2,0.05233280062675476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,2,balanced,0.13725866874059042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,2,balanced,0.1418400009473165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,2,power_law_1.01,0.1298624038696289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,2,power_law_1.01,0.1306496024131775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,2,power_law_1.2,0.12735359668731688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,2,power_law_1.2,0.13346560001373292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,32,balanced,0.043882668018341064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,32,balanced,0.043920000394185386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,32,power_law_1.01,0.04349440038204193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,32,power_law_1.01,0.043609601259231565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,32,power_law_1.2,0.043244799971580504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,32,power_law_1.2,0.04397439956665039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,4,balanced,0.08826133608818054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,4,balanced,0.08851733803749084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,4,power_law_1.01,0.08478080034255982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,4,power_law_1.01,0.08531839847564697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,4,power_law_1.2,0.08398079872131348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,4,power_law_1.2,0.08684160113334656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,64,balanced,0.04381333291530609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,64,balanced,0.04388799766699473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,64,power_law_1.01,0.04222080111503601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,64,power_law_1.01,0.04325760006904602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,64,power_law_1.2,0.04232960045337677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,64,power_law_1.2,0.042796799540519716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,8,balanced,0.06461866696675618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,8,balanced,0.06629333396752675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,8,power_law_1.01,0.06270080208778381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,8,power_law_1.01,0.063155198097229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,8,power_law_1.2,0.06215680241584778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,1,8,power_law_1.2,0.06369280219078063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,2,1,balanced,0.13523733615875244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,2,1,balanced,0.13588266571362814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,2,1,power_law_1.01,0.12894079685211182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,2,1,power_law_1.01,0.1302783966064453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,2,1,power_law_1.2,0.12951040267944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,2,1,power_law_1.2,0.13003519773483277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,4,1,balanced,0.08785067001978557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,4,1,balanced,0.08892800410588582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,4,1,power_law_1.01,0.0838271975517273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,4,1,power_law_1.01,0.08572160005569458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,4,1,power_law_1.2,0.08469120264053345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2048,768,8,128,4,1,power_law_1.2,0.08514559864997864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,1,balanced,0.5836213429768881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,1,balanced,0.5885226726531982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,1,power_law_1.01,0.5375232219696044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,1,power_law_1.01,0.5382783889770508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,1,power_law_1.2,0.5564991950988769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,1,power_law_1.2,0.5645567893981933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,128,balanced,0.05659733215967814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,128,balanced,0.056794668237368263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,128,power_law_1.01,0.05550079941749573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,128,power_law_1.01,0.05578240156173706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,128,power_law_1.2,0.05568000078201294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,128,power_law_1.2,0.05626239776611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,16,balanced,0.0823466678460439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,16,balanced,0.08237333099047343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,16,power_law_1.01,0.0797760009765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,16,power_law_1.01,0.08087040185928344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,16,power_law_1.2,0.0794431984424591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,16,power_law_1.2,0.08115199804306031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,2,balanced,0.35585065682729083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,2,balanced,0.36076800028483075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,2,power_law_1.01,0.31612799167633054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,2,power_law_1.01,0.3189120054244995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,2,power_law_1.2,0.3117824077606201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,2,power_law_1.2,0.3210560083389282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,32,balanced,0.07202666501204173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,32,balanced,0.07249600191911061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,32,power_law_1.01,0.06995840072631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,32,power_law_1.01,0.0701312005519867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,32,power_law_1.2,0.06989439725875854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,32,power_law_1.2,0.07011200189590454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,4,balanced,0.20625599225362143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,4,balanced,0.20736533403396606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,4,power_law_1.01,0.1880128026008606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,4,power_law_1.01,0.1885823965072632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,4,power_law_1.2,0.1896064043045044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,4,power_law_1.2,0.1923200011253357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,64,balanced,0.05807466804981232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,64,balanced,0.05859733124574026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,64,power_law_1.01,0.0575872004032135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,64,power_law_1.01,0.05801600217819214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,64,power_law_1.2,0.057158398628234866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,64,power_law_1.2,0.05746560096740723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,8,balanced,0.1276586651802063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,8,balanced,0.12865066528320312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,8,power_law_1.01,0.12000000476837158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,8,power_law_1.01,0.12036479711532592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,8,power_law_1.2,0.12167680263519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,1,8,power_law_1.2,0.12425600290298462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,16,1,balanced,0.2609333395957947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,16,1,balanced,0.26128532489140827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,16,1,power_law_1.01,0.23354880809783934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,16,1,power_law_1.01,0.23717119693756103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,16,1,power_law_1.2,0.23646080493927002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,16,1,power_law_1.2,0.23787519931793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,2,1,balanced,0.34920533498128253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,2,1,balanced,0.35157867272694904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,2,1,power_law_1.01,0.3113600015640259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,2,1,power_law_1.01,0.31868801116943357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,2,1,power_law_1.2,0.31249279975891114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,2,1,power_law_1.2,0.31639680862426756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,32,1,balanced,0.1891146699587504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,32,1,balanced,0.18923733631769815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,32,1,power_law_1.01,0.1649791955947876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,32,1,power_law_1.01,0.16839040517807008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,32,1,power_law_1.2,0.17407360076904296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,32,1,power_law_1.2,0.17433600425720214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,4,1,balanced,0.2071839968363444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,4,1,balanced,0.2095306714375814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,4,1,power_law_1.01,0.19061119556427003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,4,1,power_law_1.01,0.1969151973724365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,4,1,power_law_1.2,0.1901247978210449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,4,1,power_law_1.2,0.19530240297317505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,8,1,balanced,0.4134026765823364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,8,1,balanced,0.4134666522343953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,8,1,power_law_1.01,0.36074879169464114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,8,1,power_law_1.01,0.379366397857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,8,1,power_law_1.2,0.380947208404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,2688,1856,6,128,8,1,power_law_1.2,0.3826495885848999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,1,balanced,1.1508106390635173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,1,balanced,1.1648906866709392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,1,power_law_1.01,0.9286848068237304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,1,power_law_1.01,0.9441663742065429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,1,power_law_1.2,0.931430435180664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,1,power_law_1.2,0.9432895660400391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,128,balanced,0.08844266335169475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,128,balanced,0.08853866656621297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,128,power_law_1.01,0.08634240031242371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,128,power_law_1.01,0.08711040019989014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,128,power_law_1.2,0.0864192008972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,128,power_law_1.2,0.08701440095901489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,16,balanced,0.1471680005391439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,16,balanced,0.14850133657455444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,16,power_law_1.01,0.12603520154953002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,16,power_law_1.01,0.13156479597091675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,16,power_law_1.2,0.12335360050201416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,16,power_law_1.2,0.13660160303115845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,2,balanced,0.6083146731058756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,2,balanced,0.6133439938227335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,2,power_law_1.01,0.5164927959442138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,2,power_law_1.01,0.5373951911926269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,2,power_law_1.2,0.5139520168304443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,2,power_law_1.2,0.52773118019104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,256,balanced,0.0867786705493927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,256,balanced,0.0885813335577647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,256,power_law_1.01,0.08565120100975036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,256,power_law_1.01,0.08589439988136291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,256,power_law_1.2,0.08551679849624634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,256,power_law_1.2,0.08608639836311341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,32,balanced,0.10108266274134318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,32,balanced,0.1011199951171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,32,power_law_1.01,0.09916800260543823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,32,power_law_1.01,0.09919360280036926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,32,power_law_1.2,0.09734399914741516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,32,power_law_1.2,0.09783679842948914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,4,balanced,0.3478399912516276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,4,balanced,0.3519146839777629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,4,power_law_1.01,0.30341761112213134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,4,power_law_1.01,0.3195136070251465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,4,power_law_1.2,0.29282560348510744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,4,power_law_1.2,0.31877760887145995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,64,balanced,0.09490666786829631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,64,balanced,0.09499200185139973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,64,power_law_1.01,0.0918079972267151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,64,power_law_1.01,0.0919871985912323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,64,power_law_1.2,0.09189119935035706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,64,power_law_1.2,0.09208319783210754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,8,balanced,0.2097760041554769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,8,balanced,0.21178666750590006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,8,power_law_1.01,0.19070080518722535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,8,power_law_1.01,0.1959231972694397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,8,power_law_1.2,0.18877439498901366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,1,8,power_law_1.2,0.19322880506515502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,16,1,balanced,0.1663146714369456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,16,1,balanced,0.16660799582799277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,16,1,power_law_1.01,0.13013119697570802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,16,1,power_law_1.01,0.1351359963417053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,16,1,power_law_1.2,0.1295040011405945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,16,1,power_law_1.2,0.13000960350036622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,2,1,balanced,0.6027573347091675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,2,1,balanced,0.6029333273569742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,2,1,power_law_1.01,0.5033599853515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,2,1,power_law_1.01,0.5090176105499268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,2,1,power_law_1.2,0.49799041748046874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,2,1,power_law_1.2,0.49933438301086425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,32,1,balanced,0.12141866485277812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,32,1,balanced,0.12148267030715942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,32,1,power_law_1.01,0.11167360544204712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,32,1,power_law_1.01,0.11189119815826416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,32,1,power_law_1.2,0.11075839996337891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,32,1,power_law_1.2,0.11219199895858764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,4,1,balanced,0.3387146790822347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,4,1,balanced,0.34014399846394855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,4,1,power_law_1.01,0.28345599174499514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,4,1,power_law_1.01,0.28478078842163085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,4,1,power_law_1.2,0.2807168006896973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,4,1,power_law_1.2,0.2816384077072144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,8,1,balanced,0.20578134059906006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,8,1,balanced,0.2079733411471049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,8,1,power_law_1.01,0.18465280532836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,8,1,power_law_1.01,0.18506239652633666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,8,1,power_law_1.2,0.18302079439163207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,3072,1536,8,256,8,1,power_law_1.2,0.18403199911117554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,1,balanced,0.5054293473561605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,1,balanced,0.5054719845453898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,1,power_law_1.01,0.525491189956665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,1,power_law_1.01,0.5352128028869629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,1,power_law_1.2,0.5169663906097413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,1,power_law_1.2,0.5238976001739502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,2,balanced,0.3304160038630168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,2,balanced,0.33088000615437824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,2,power_law_1.01,0.3367552042007446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,2,power_law_1.01,0.3421504020690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,2,power_law_1.2,0.34515841007232667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,2,power_law_1.2,0.3505280017852783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,4,balanced,0.246288001537323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,4,balanced,0.2516160011291504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,4,power_law_1.01,0.2544384002685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,4,power_law_1.01,0.2593024015426636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,4,power_law_1.2,0.25936639308929443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,4,power_law_1.2,0.2600127935409546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,8,balanced,0.19334399700164795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,8,balanced,0.19350934028625488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,8,power_law_1.01,0.21683199405670167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,8,power_law_1.01,0.219321608543396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,8,power_law_1.2,0.2188352108001709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,1,8,power_law_1.2,0.21921920776367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,16,1,balanced,0.07526933153470357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,16,1,balanced,0.0763626645008723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,16,1,power_law_1.01,0.07332479953765869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,16,1,power_law_1.01,0.07365120053291321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,16,1,power_law_1.2,0.0723904013633728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,16,1,power_law_1.2,0.07320320010185241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,2,1,balanced,0.2810399929682414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,2,1,balanced,0.2834133307139079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,2,1,power_law_1.01,0.2794111967086792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,2,1,power_law_1.01,0.2817280054092407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,2,1,power_law_1.2,0.2814143896102905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,2,1,power_law_1.2,0.2821376085281372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,32,1,balanced,0.059205333391825356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,32,1,balanced,0.05971199770768484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,32,1,power_law_1.01,0.060198402404785155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,32,1,power_law_1.01,0.061939197778701785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,32,1,power_law_1.2,0.060288000106811526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,32,1,power_law_1.2,0.060812801122665405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,4,1,balanced,0.1701386570930481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,4,1,balanced,0.1730453372001648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,4,1,power_law_1.01,0.16543359756469728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,4,1,power_law_1.01,0.16620800495147706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,4,1,power_law_1.2,0.16624000072479247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,4,1,power_law_1.2,0.1662976026535034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,8,1,balanced,0.09823999802271526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,8,1,balanced,0.09866666793823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,8,1,power_law_1.01,0.09304959774017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,8,1,power_law_1.01,0.09505280256271362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,8,1,power_law_1.2,0.09436799883842469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,14336,2,8,8,1,power_law_1.2,0.09496319890022278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,1,balanced,0.779088020324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,1,balanced,0.7808372974395752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,1,power_law_1.01,0.7392831802368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,1,power_law_1.01,0.7439295768737793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,1,power_law_1.2,0.7503551959991455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,1,power_law_1.2,0.7509247779846191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,128,balanced,0.06617600222428639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,128,balanced,0.0664106657107671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,128,power_law_1.01,0.06450560092926025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,128,power_law_1.01,0.0664192020893097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,128,power_law_1.2,0.06429439783096313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,128,power_law_1.2,0.06440320014953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,16,balanced,0.1039520005385081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,16,balanced,0.10414933164914449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,16,power_law_1.01,0.09879040122032165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,16,power_law_1.01,0.10122879743576049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,16,power_law_1.2,0.10165120363235473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,16,power_law_1.2,0.10168319940567017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,2,balanced,0.42496001720428467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,2,balanced,0.4262239933013916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,2,power_law_1.01,0.4142399787902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,2,power_law_1.01,0.4142464160919189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,2,power_law_1.2,0.4009727954864502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,2,power_law_1.2,0.42087678909301757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,32,balanced,0.09063466389973958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,32,balanced,0.09096533060073853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,32,power_law_1.01,0.08828160166740417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,32,power_law_1.01,0.08889600038528442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,32,power_law_1.2,0.0867904007434845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,32,power_law_1.2,0.08837119936943054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,4,balanced,0.23958933353424072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,4,balanced,0.24022400379180908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,4,power_law_1.01,0.2309056043624878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,4,power_law_1.01,0.2339263916015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,4,power_law_1.2,0.23756799697875977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,4,power_law_1.2,0.23970561027526854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,64,balanced,0.08070933322111766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,64,balanced,0.08261866867542267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,64,power_law_1.01,0.077920001745224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,64,power_law_1.01,0.07899519801139832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,64,power_law_1.2,0.0775488018989563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,64,power_law_1.2,0.0791808009147644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,8,balanced,0.1525173286596934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,8,balanced,0.15433067083358765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,8,power_law_1.01,0.14529919624328613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,8,power_law_1.01,0.14608000516891478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,8,power_law_1.2,0.14595199823379518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,1,8,power_law_1.2,0.14967039823532105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,16,1,balanced,0.11914666493733723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,16,1,balanced,0.11930132905642192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,16,1,power_law_1.01,0.11409920454025269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,16,1,power_law_1.01,0.1143231987953186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,16,1,power_law_1.2,0.11396479606628418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,16,1,power_law_1.2,0.1146880030632019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,2,1,balanced,0.3903786738713582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,2,1,balanced,0.39348268508911133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,2,1,power_law_1.01,0.37008640766143797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,2,1,power_law_1.01,0.37311999797821044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,2,1,power_law_1.2,0.3849152088165283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,2,1,power_law_1.2,0.40570878982543945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,32,1,balanced,0.10341333349545796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,32,1,balanced,0.10469333330790202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,32,1,power_law_1.01,0.09996799826622009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,32,1,power_law_1.01,0.10073599815368653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,32,1,power_law_1.2,0.1007040023803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,32,1,power_law_1.2,0.10117759704589843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,4,1,balanced,0.23593066136042276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,4,1,balanced,0.23669334252675375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,4,1,power_law_1.01,0.2261120080947876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,4,1,power_law_1.01,0.2284543991088867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,4,1,power_law_1.2,0.2278656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,4,1,power_law_1.2,0.2313215970993042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,8,1,balanced,0.15031466881434122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,8,1,balanced,0.15081600348154703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,8,1,power_law_1.01,0.14420479536056519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,8,1,power_law_1.01,0.14436479806900024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,8,1,power_law_1.2,0.1441472053527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,1536,8,128,8,1,power_law_1.2,0.14449280500411987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,1,balanced,5.172863960266113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,1,balanced,5.216058731079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,1,power_law_1.01,4.597779083251953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,1,power_law_1.01,4.618080139160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,1,power_law_1.2,4.566521453857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,1,power_law_1.2,4.762828826904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,128,balanced,0.25667200485865277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,128,balanced,0.25872000058492023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,128,power_law_1.01,0.25477759838104247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,128,power_law_1.01,0.2560447931289673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,128,power_law_1.2,0.2547904014587402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,128,power_law_1.2,0.2554624080657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,16,balanced,0.5581706762313843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,16,balanced,0.5595893462498983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,16,power_law_1.01,0.5200384140014649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,16,power_law_1.01,0.5325376033782959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,16,power_law_1.2,0.52609281539917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,16,power_law_1.2,0.5312960147857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,2,balanced,2.6974719365437827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,2,balanced,2.749349276224772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,2,power_law_1.01,2.3490047454833984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,2,power_law_1.01,2.414944076538086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,2,power_law_1.2,2.3971967697143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,2,power_law_1.2,2.4406911849975588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,256,balanced,0.24861333767573038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,256,balanced,0.250602662563324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,256,power_law_1.01,0.24697599411010743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,256,power_law_1.01,0.24714241027832032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,256,power_law_1.2,0.24734721183776856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,256,power_law_1.2,0.2477184057235718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,32,balanced,0.39044801394144696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,32,balanced,0.3936213254928589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,32,power_law_1.01,0.3764096021652222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,32,power_law_1.01,0.38000640869140623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,32,power_law_1.2,0.37260799407958983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,32,power_law_1.2,0.38750081062316893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,4,balanced,1.4745333989461262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,4,balanced,1.4883839289347331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,4,power_law_1.01,1.327564811706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,4,power_law_1.01,1.3364288330078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,4,power_law_1.2,1.3184127807617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,4,power_law_1.2,1.3339455604553223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,64,balanced,0.2913813392321269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,64,balanced,0.29315733909606934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,64,power_law_1.01,0.28440959453582765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,64,power_law_1.01,0.2910271883010864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,64,power_law_1.2,0.28460159301757815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,64,power_law_1.2,0.28885760307312014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,8,balanced,0.8625973065694174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,8,balanced,0.8628266652425131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,8,power_law_1.01,0.7956031799316406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,8,power_law_1.01,0.8203200340270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,8,power_law_1.2,0.7814464092254638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,1,8,power_law_1.2,0.8095232009887695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,16,1,balanced,1.7109707196553547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,16,1,balanced,1.712949275970459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,16,1,power_law_1.01,1.5171327590942383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,16,1,power_law_1.01,1.519545555114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,16,1,power_law_1.2,1.5360511779785155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,16,1,power_law_1.2,1.5409664154052733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,2,1,balanced,2.465775966644287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,2,1,balanced,2.4707253774007163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,2,1,power_law_1.01,2.1395263671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,2,1,power_law_1.01,2.1683135986328126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,2,1,power_law_1.2,2.1876928329467775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,2,1,power_law_1.2,2.202079963684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,32,1,balanced,1.3090133666992188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,32,1,balanced,1.3090346654256184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,32,1,power_law_1.01,1.1596863746643067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,32,1,power_law_1.01,1.161017608642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,32,1,power_law_1.2,1.1617600440979003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,32,1,power_law_1.2,1.1911808013916017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,4,1,balanced,1.3728000322977703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,4,1,balanced,1.3785600662231445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,4,1,power_law_1.01,1.2256640434265136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,4,1,power_law_1.01,1.2266752243041992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,4,1,power_law_1.2,1.2428607940673828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,4,1,power_law_1.2,1.2587136268615722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,8,1,balanced,0.7743306954701742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,8,1,balanced,0.7792747020721436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,8,1,power_law_1.01,0.7026559829711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,8,1,power_law_1.01,0.7051263809204101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,8,1,power_law_1.2,0.7068480014801025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,4096,2688,22,512,8,1,power_law_1.2,0.7192959785461426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,1,balanced,0.78493865331014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,1,balanced,0.7888639767964681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,1,power_law_1.01,0.8835200309753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,1,power_law_1.01,0.9003520011901855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,1,power_law_1.2,0.8829695701599121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,1,power_law_1.2,0.890169620513916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,2,balanced,0.4763360023498535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,2,balanced,0.4772160053253174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,2,power_law_1.01,0.4915008068084717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,2,power_law_1.01,0.5064191818237305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,2,power_law_1.2,0.49260802268981935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,2,power_law_1.2,0.5299839973449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,4,balanced,0.329802672068278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,4,balanced,0.33078932762145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,4,power_law_1.01,0.3453183889389038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,4,power_law_1.01,0.34783999919891356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,4,power_law_1.2,0.3353087902069092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,4,power_law_1.2,0.34381439685821535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,8,balanced,0.2409013311068217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,8,balanced,0.24225066105524698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,8,power_law_1.01,0.28669440746307373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,8,power_law_1.01,0.2868160009384155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,8,power_law_1.2,0.2769536018371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,1,8,power_law_1.2,0.2879296064376831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,16,1,balanced,0.1011306643486023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,16,1,balanced,0.10186666250228882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,16,1,power_law_1.01,0.10153599977493286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,16,1,power_law_1.01,0.10472320318222046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,16,1,power_law_1.2,0.10061440467834473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,16,1,power_law_1.2,0.10442240238189697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,2,1,balanced,0.43231467405955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,2,1,balanced,0.434224009513855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,2,1,power_law_1.01,0.42110719680786135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,2,1,power_law_1.01,0.4287168025970459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,2,1,power_law_1.2,0.4347519874572754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,2,1,power_law_1.2,0.4454016208648682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,32,1,balanced,0.08611733714739482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,32,1,balanced,0.08679466446240743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,32,1,power_law_1.01,0.08804479837417603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,32,1,power_law_1.01,0.09034879803657532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,32,1,power_law_1.2,0.085971200466156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,32,1,power_law_1.2,0.0886080026626587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,4,1,balanced,0.2537813385327657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,4,1,balanced,0.2610666751861572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,4,1,power_law_1.01,0.25347199440002444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,4,1,power_law_1.01,0.25661439895629884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,4,1,power_law_1.2,0.24413440227508545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,4,1,power_law_1.2,0.26371839046478274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,8,1,balanced,0.13421333829561868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,8,1,balanced,0.13913066188494363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,8,1,power_law_1.01,0.13920639753341674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,8,1,power_law_1.01,0.14106240272521972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,8,1,power_law_1.2,0.13496320247650145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,16384,2,8,8,1,power_law_1.2,0.1403712034225464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,1,balanced,2.9551518758138022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,1,balanced,3.121077219645182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,1,power_law_1.01,2.4284479141235353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,1,power_law_1.01,2.442451286315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,1,power_law_1.2,2.4508735656738283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,1,power_law_1.2,2.4882816314697265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,128,balanced,0.15036799510320029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,128,balanced,0.1506666640440623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,128,power_law_1.01,0.14844160079956054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,128,power_law_1.01,0.14871679544448851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,128,power_law_1.2,0.147871994972229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,128,power_law_1.2,0.14876799583435057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,16,balanced,0.31066666046778363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,16,balanced,0.31176533301671344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,16,power_law_1.01,0.270412802696228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,16,power_law_1.01,0.2852544069290161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,16,power_law_1.2,0.2913856029510498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,16,power_law_1.2,0.29160959720611573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,2,balanced,1.5519626935323079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,2,balanced,1.5824426015218098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,2,power_law_1.01,1.2465344429016114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,2,power_law_1.01,1.2749504089355468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,2,power_law_1.2,1.2782079696655273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,2,power_law_1.2,1.2980095863342285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,256,balanced,0.13800000150998434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,256,balanced,0.13965866963068643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,256,power_law_1.01,0.13583999872207642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,256,power_law_1.01,0.13886719942092896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,256,power_law_1.2,0.1366976022720337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,256,power_law_1.2,0.13815679550170898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,32,balanced,0.19779199361801147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,32,balanced,0.19824532667795816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,32,power_law_1.01,0.1824447989463806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,32,power_law_1.01,0.18908159732818602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,32,power_law_1.2,0.189683198928833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,32,power_law_1.2,0.19033600091934205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,4,balanced,0.8270933628082275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,4,balanced,0.8271733125050863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,4,power_law_1.01,0.7247744083404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,4,power_law_1.01,0.724889612197876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,4,power_law_1.2,0.7058815956115723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,4,power_law_1.2,0.7367360115051269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,64,balanced,0.15889599919319153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,64,balanced,0.15989333391189575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,64,power_law_1.01,0.1569983959197998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,64,power_law_1.01,0.15700479745864868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,64,power_law_1.2,0.15475200414657592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,64,power_law_1.2,0.15565439462661743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,8,balanced,0.48109865188598633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,8,balanced,0.48511465390523273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,8,power_law_1.01,0.4365375995635986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,8,power_law_1.01,0.4425471782684326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,8,power_law_1.2,0.41064958572387694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,1,8,power_law_1.2,0.41548800468444824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,16,1,balanced,0.3240639964739482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,16,1,balanced,0.32518933216730755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,16,1,power_law_1.01,0.25289599895477294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,16,1,power_law_1.01,0.25411200523376465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,16,1,power_law_1.2,0.25484158992767336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,16,1,power_law_1.2,0.2556159973144531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,2,1,balanced,1.540346622467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,2,1,balanced,1.5543947219848633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,2,1,power_law_1.01,1.2634048461914062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,2,1,power_law_1.01,1.2761664390563965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,2,1,power_law_1.2,1.262758445739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,2,1,power_law_1.2,1.297804832458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,32,1,balanced,0.22452799479166666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,32,1,balanced,0.22554665803909302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,32,1,power_law_1.01,0.20604801177978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,32,1,power_law_1.01,0.20677120685577394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,32,1,power_law_1.2,0.2074496030807495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,32,1,power_law_1.2,0.20767359733581542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,4,1,balanced,0.8009386857350668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,4,1,balanced,0.8015680313110352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,4,1,power_law_1.01,0.6617152214050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,4,1,power_law_1.01,0.6684800148010254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,4,1,power_law_1.2,0.6645952224731445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,4,1,power_law_1.2,0.6764416217803955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,8,1,balanced,0.4734506607055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,8,1,balanced,0.47470398743947345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,8,1,power_law_1.01,0.3855743885040283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,8,1,power_law_1.01,0.38664319515228274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,8,1,power_law_1.2,0.38518400192260743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2048,8,256,8,1,power_law_1.2,0.3880511999130249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,1,balanced,2.328767935434977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,1,balanced,2.3407252629597983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,1,power_law_1.01,2.1369792938232424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,1,power_law_1.01,2.1429887771606446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,1,power_law_1.2,2.155276870727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,1,power_law_1.2,2.176371192932129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,16,balanced,0.23746132850646973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,16,balanced,0.23760000864664713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,16,power_law_1.01,0.22074880599975585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,16,power_law_1.01,0.2211456060409546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,16,power_law_1.2,0.22045440673828126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,16,power_law_1.2,0.22503039836883545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,2,balanced,1.2434240182240803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,2,balanced,1.2531147003173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,2,power_law_1.01,1.0822976112365723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,2,power_law_1.01,1.0908032417297364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,2,power_law_1.2,1.1150527954101563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,2,power_law_1.2,1.1278271675109863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,32,balanced,0.151637335618337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,32,balanced,0.15227199594179788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,32,power_law_1.01,0.14691840410232543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,32,power_law_1.01,0.14948480129241942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,32,power_law_1.2,0.14729599952697753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,32,power_law_1.2,0.1495743989944458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,4,balanced,0.6509333451588949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,4,balanced,0.6517920096715292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,4,power_law_1.01,0.6174975872039795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,4,power_law_1.01,0.6266496181488037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,4,power_law_1.2,0.6109632015228271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,4,power_law_1.2,0.6151552200317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,8,balanced,0.36740267276763916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,8,balanced,0.36760000387827557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,8,power_law_1.01,0.34013440608978274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,8,power_law_1.01,0.3478656053543091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,8,power_law_1.2,0.3440576076507568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,1,8,power_law_1.2,0.3509887933731079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,16,1,balanced,0.26553066571553546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,16,1,balanced,0.26662399371465045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,16,1,power_law_1.01,0.2105855941772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,16,1,power_law_1.01,0.22086400985717775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,16,1,power_law_1.2,0.22970240116119384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,16,1,power_law_1.2,0.23291521072387694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,2,1,balanced,1.209941307703654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,2,1,balanced,1.2244799931844075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,2,1,power_law_1.01,1.0937536239624024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,2,1,power_law_1.01,1.1083840370178222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,2,1,power_law_1.2,1.1224191665649415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,2,1,power_law_1.2,1.1254719734191894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,32,1,balanced,0.18295466899871826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,32,1,balanced,0.18440532684326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,32,1,power_law_1.01,0.1736448049545288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,32,1,power_law_1.01,0.17393920421600342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,32,1,power_law_1.2,0.17597440481185914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,32,1,power_law_1.2,0.17658239603042603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,4,1,balanced,0.6395893494288126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,4,1,balanced,0.6415306727091471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,4,1,power_law_1.01,0.5977280139923096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,4,1,power_law_1.01,0.5987008094787598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,4,1,power_law_1.2,0.6009151935577393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,4,1,power_law_1.2,0.6090176105499268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,8,1,balanced,0.35859731833140057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,8,1,balanced,0.3588426510492961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,8,1,power_law_1.01,0.3328511953353882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,8,1,power_law_1.01,0.3379519939422607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,8,1,power_law_1.2,0.33946239948272705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,6144,2560,8,160,8,1,power_law_1.2,0.33992319107055663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,1,balanced,3.460224151611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,1,balanced,3.4702345530192056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,1,power_law_1.01,2.844812774658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,1,power_law_1.01,2.9091136932373045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,1,power_law_1.2,2.8533632278442385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,1,power_law_1.2,2.900172805786133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,128,balanced,0.17082132895787558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,128,balanced,0.17297599713007608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,128,power_law_1.01,0.1691648006439209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,128,power_law_1.01,0.1699136018753052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,128,power_law_1.2,0.1689919948577881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,128,power_law_1.2,0.16999679803848267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,16,balanced,0.36901867389678955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,16,balanced,0.372106671333313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,16,power_law_1.01,0.3279551982879639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,16,power_law_1.01,0.3309823989868164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,16,power_law_1.2,0.3226239919662476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,16,power_law_1.2,0.32934401035308836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,2,balanced,1.8547946612040203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,2,balanced,1.8608640034993489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,2,power_law_1.01,1.5320768356323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,2,power_law_1.01,1.5420160293579102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,2,power_law_1.2,1.5072704315185548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,2,power_law_1.2,1.512019157409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,256,balanced,0.1625866691271464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,256,balanced,0.1646880010763804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,256,power_law_1.01,0.1604864001274109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,256,power_law_1.01,0.16307200193405152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,256,power_law_1.2,0.1598080039024353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,256,power_law_1.2,0.16250879764556886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,32,balanced,0.23423999547958374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,32,balanced,0.23430933554967245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,32,power_law_1.01,0.21923201084136962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,32,power_law_1.01,0.22910079956054688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,32,power_law_1.2,0.22434558868408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,32,power_law_1.2,0.22565760612487792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,4,balanced,0.9669439792633057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,4,balanced,0.9670506318410238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,4,power_law_1.01,0.8252415657043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,4,power_law_1.01,0.836678409576416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,4,power_law_1.2,0.8246975898742676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,4,power_law_1.2,0.8458815574645996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,64,balanced,0.180458664894104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,64,balanced,0.1809813380241394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,64,power_law_1.01,0.17942399978637696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,64,power_law_1.01,0.17946879863739013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,64,power_law_1.2,0.17517440319061278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,64,power_law_1.2,0.17748479843139647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,8,balanced,0.5664960145950317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,8,balanced,0.5709653298060099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,8,power_law_1.01,0.4733759880065918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,8,power_law_1.01,0.503059196472168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,8,power_law_1.2,0.5295743942260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,1,8,power_law_1.2,0.5320831775665283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,16,1,balanced,0.37571199735005695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,16,1,balanced,0.3763146797815959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,16,1,power_law_1.01,0.2916863918304443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,16,1,power_law_1.01,0.2961344003677368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,16,1,power_law_1.2,0.2907711982727051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,16,1,power_law_1.2,0.2938816070556641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,2,1,balanced,1.8076319694519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,2,1,balanced,1.8570079803466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,2,1,power_law_1.01,1.4709888458251954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,2,1,power_law_1.01,1.4961983680725097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,2,1,power_law_1.2,1.4758784294128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,2,1,power_law_1.2,1.4928959846496581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,32,1,balanced,0.257749338944753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,32,1,balanced,0.258245329062144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,32,1,power_law_1.01,0.23479681015014647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,32,1,power_law_1.01,0.23538560867309571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,32,1,power_law_1.2,0.23386878967285157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,32,1,power_law_1.2,0.23639678955078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,4,1,balanced,0.9333653450012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,4,1,balanced,0.9350986480712891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,4,1,power_law_1.01,0.7756800174713134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,4,1,power_law_1.01,0.7809279918670654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,4,1,power_law_1.2,0.775987195968628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,4,1,power_law_1.2,0.7772287845611572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,8,1,balanced,0.552074670791626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,8,1,balanced,0.55458664894104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,8,1,power_law_1.01,0.44581117630004885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,8,1,power_law_1.01,0.4482624053955078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,8,1,power_law_1.2,0.4414976119995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,256,8,1,power_law_1.2,0.4555520057678223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,1,balanced,5.374037424723308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,1,balanced,5.378682454427083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,1,power_law_1.01,3.8788928985595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,1,power_law_1.01,3.912070465087891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,1,power_law_1.2,3.840595245361328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,1,power_law_1.2,3.857990264892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,128,balanced,0.21363200743993124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,128,balanced,0.21387199560801187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,128,power_law_1.01,0.21067519187927247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,128,power_law_1.01,0.2114176034927368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,128,power_law_1.2,0.2099071979522705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,128,power_law_1.2,0.21114881038665773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,16,balanced,0.49354668458302814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,16,balanced,0.4935733477274577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,16,power_law_1.01,0.45350399017333987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,16,power_law_1.01,0.46968960762023926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,16,power_law_1.2,0.4478784084320068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,16,power_law_1.2,0.460646390914917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,2,balanced,2.7416747411092124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,2,balanced,2.7564798990885415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,2,power_law_1.01,2.0010175704956055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,2,power_law_1.01,2.081817626953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,2,power_law_1.2,1.9618431091308595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,2,power_law_1.2,2.1229120254516602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,32,balanced,0.3354560136795044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,32,balanced,0.33613332112630206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,32,power_law_1.01,0.2935935974121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,32,power_law_1.01,0.2984832048416138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,32,power_law_1.2,0.29617919921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,32,power_law_1.2,0.30091519355773927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,4,balanced,1.4271094004313152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,4,balanced,1.4365173975626628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,4,power_law_1.01,1.1873536109924316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,4,power_law_1.01,1.214790439605713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,4,power_law_1.2,1.1257280349731444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,4,power_law_1.2,1.284780788421631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,64,balanced,0.23666665951410928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,64,balanced,0.23826134204864502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,64,power_law_1.01,0.22525439262390137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,64,power_law_1.01,0.23601279258728028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,64,power_law_1.2,0.22368640899658204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,64,power_law_1.2,0.22899200916290283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,8,balanced,0.8044799963633219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,8,balanced,0.8098346392313639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,8,power_law_1.01,0.6867008209228516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,8,power_law_1.01,0.6984447956085205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,8,power_law_1.2,0.6086463928222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,1,8,power_law_1.2,0.697657585144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,16,1,balanced,0.4896053473154704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,16,1,balanced,0.49218134085337323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,16,1,power_law_1.01,0.42442879676818845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,16,1,power_law_1.01,0.4247488021850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,16,1,power_law_1.2,0.41930241584777833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,16,1,power_law_1.2,0.4217984199523926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,2,1,balanced,2.728015899658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,2,1,balanced,2.7500425974527993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,2,1,power_law_1.01,1.9948287963867188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,2,1,power_law_1.01,2.0515520095825197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,2,1,power_law_1.2,1.9387712478637695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,2,1,power_law_1.2,1.976736068725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,32,1,balanced,0.35499731699625653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,32,1,balanced,0.35573331514994305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,32,1,power_law_1.01,0.30271999835968016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,32,1,power_law_1.01,0.30391678810119627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,32,1,power_law_1.2,0.29663360118865967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,32,1,power_law_1.2,0.2974015951156616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,4,1,balanced,1.3584052721659343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,4,1,balanced,1.3854293823242188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,4,1,power_law_1.01,1.0727744102478027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,4,1,power_law_1.01,1.0882752418518067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,4,1,power_law_1.2,1.027667236328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,4,1,power_law_1.2,1.0604607582092285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,8,1,balanced,0.7824693520863851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,8,1,balanced,0.7848693529764811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,8,1,power_law_1.01,0.6175615787506104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,8,1,power_law_1.01,0.6224448204040527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,8,1,power_law_1.2,0.6066751956939698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,128,7168,2048,8,384,8,1,power_law_1.2,0.609657621383667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,1,balanced,0.32080533107121784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,1,balanced,0.3261386752128601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,1,power_law_1.01,0.357043194770813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,1,power_law_1.01,0.36110720634460447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,1,power_law_1.2,0.36757121086120603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,1,power_law_1.2,0.36815359592437746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,128,balanced,0.10617066423098247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,128,balanced,0.10929066936175029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,128,power_law_1.01,0.11031039953231811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,128,power_law_1.01,0.11068160533905029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,128,power_law_1.2,0.11318399906158447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,128,power_law_1.2,0.11673599481582642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,16,balanced,0.12027733524640401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,16,balanced,0.12250133355458577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,16,power_law_1.01,0.12988799810409546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,16,power_law_1.01,0.13081599473953248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,16,power_law_1.2,0.13607679605484008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,16,power_law_1.2,0.13626240491867064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,2,balanced,0.22887466351191202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,2,balanced,0.23190399010976157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,2,power_law_1.01,0.26368639469146726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,2,power_law_1.01,0.266431999206543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,2,power_law_1.2,0.2742271900177002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,2,power_law_1.2,0.27619199752807616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,32,balanced,0.11403200030326843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,32,balanced,0.11486400167147319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,32,power_law_1.01,0.11905920505523682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,32,power_law_1.01,0.1201024055480957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,32,power_law_1.2,0.12153600454330445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,32,power_law_1.2,0.12275840044021606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,4,balanced,0.1710453430811564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,4,balanced,0.17122666041056314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,4,power_law_1.01,0.1974527955055237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,4,power_law_1.01,0.1980288028717041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,4,power_law_1.2,0.1982591986656189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,4,power_law_1.2,0.20078721046447753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,64,balanced,0.10937066872914632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,64,balanced,0.11097600062688191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,64,power_law_1.01,0.11466879844665527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,64,power_law_1.01,0.11477760076522828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,64,power_law_1.2,0.1177664041519165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,64,power_law_1.2,0.11851520538330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,8,balanced,0.1358506679534912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,8,balanced,0.1360266705354055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,8,power_law_1.01,0.15200639963150026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,8,power_law_1.01,0.15593600273132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,8,power_law_1.2,0.16161919832229615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,1,8,power_law_1.2,0.16222720146179198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,2,1,balanced,0.20558400948842367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,2,1,balanced,0.2062186598777771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,2,1,power_law_1.01,0.23639039993286132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,2,1,power_law_1.01,0.23863039016723633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,2,1,power_law_1.2,0.24325120449066162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,2,1,power_law_1.2,0.24741120338439943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,4,1,balanced,0.15371732910474142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,4,1,balanced,0.1562399963537852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,4,1,power_law_1.01,0.16741759777069093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,4,1,power_law_1.01,0.168012797832489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,4,1,power_law_1.2,0.1684864044189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2048,768,8,128,4,1,power_law_1.2,0.17496960163116454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,1,balanced,0.7861386934916178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,1,balanced,0.7921013037363688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,1,power_law_1.01,0.8514623641967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,1,power_law_1.01,0.8664575576782226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,1,power_law_1.2,0.8774975776672364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,1,power_law_1.2,0.8870783805847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,128,balanced,0.13994133472442627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,128,balanced,0.1421119968096415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,128,power_law_1.01,0.14961279630661012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,128,power_law_1.01,0.15302400588989257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,128,power_law_1.2,0.16020480394363404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,128,power_law_1.2,0.16284159421920777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,16,balanced,0.18307199080785116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,16,balanced,0.1844266653060913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,16,power_law_1.01,0.2088383913040161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,16,power_law_1.01,0.20995841026306153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,16,power_law_1.2,0.21886079311370848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,16,power_law_1.2,0.2264319896697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,2,balanced,0.4910399913787842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,2,balanced,0.4935893217722575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,2,power_law_1.01,0.5528895854949951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,2,power_law_1.01,0.556876802444458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,2,power_law_1.2,0.5666048049926757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,2,power_law_1.2,0.5687488079071045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,32,balanced,0.15636266271273294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,32,balanced,0.15650666753451029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,32,power_law_1.01,0.17386239767074585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,32,power_law_1.01,0.17782399654388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,32,power_law_1.2,0.1843008041381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,32,power_law_1.2,0.19447679519653321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,4,balanced,0.3237173358599345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,4,balanced,0.32445865869522095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,4,power_law_1.01,0.3582655906677246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,4,power_law_1.01,0.360697603225708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,4,power_law_1.2,0.3622656106948853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,4,power_law_1.2,0.3737152099609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,64,balanced,0.14485866824785867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,64,balanced,0.14577066898345947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,64,power_law_1.01,0.15648640394210817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,64,power_law_1.01,0.16072959899902345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,64,power_law_1.2,0.16930559873580933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,64,power_law_1.2,0.17103359699249268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,8,balanced,0.23238933086395264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,8,balanced,0.2328746716181437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,8,power_law_1.01,0.2563776016235352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,8,power_law_1.01,0.2686784029006958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,8,power_law_1.2,0.2686592102050781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,1,8,power_law_1.2,0.2743295907974243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,16,1,balanced,0.295632004737854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,16,1,balanced,0.2958079973856608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,16,1,power_law_1.01,0.36260480880737306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,16,1,power_law_1.01,0.36710400581359864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,16,1,power_law_1.2,0.37229440212249754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,16,1,power_law_1.2,0.3734080076217651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,2,1,balanced,0.4683306614557902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,2,1,balanced,0.46879998842875165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,2,1,power_law_1.01,0.521292781829834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,2,1,power_law_1.01,0.5215231895446777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,2,1,power_law_1.2,0.5314047813415528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,2,1,power_law_1.2,0.5345727920532226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,32,1,balanced,0.24253332614898682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,32,1,balanced,0.24290666977564493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,32,1,power_law_1.01,0.3021631956100464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,32,1,power_law_1.01,0.3027071952819824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,32,1,power_law_1.2,0.3058687925338745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,32,1,power_law_1.2,0.308409595489502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,4,1,balanced,0.29259733359018963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,4,1,balanced,0.2935946583747864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,4,1,power_law_1.01,0.32560000419616697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,4,1,power_law_1.01,0.3273920059204102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,4,1,power_law_1.2,0.33281280994415285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,4,1,power_law_1.2,0.33413760662078856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,8,1,balanced,0.38389865557352704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,8,1,balanced,0.3840159972508748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,8,1,power_law_1.01,0.4625728130340576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,8,1,power_law_1.01,0.46689281463623045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,8,1,power_law_1.2,0.47657599449157717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,2688,1856,6,128,8,1,power_law_1.2,0.4788095951080322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,1,balanced,1.4559520085652669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,1,balanced,1.4918239911397297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,1,power_law_1.01,1.4841983795166016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,1,power_law_1.01,1.4870464324951171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,1,power_law_1.2,1.559059238433838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,1,power_law_1.2,1.5616127967834472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,128,balanced,0.19318399826685587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,128,balanced,0.194650669892629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,128,power_law_1.01,0.20247039794921876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,128,power_law_1.01,0.2037247896194458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,128,power_law_1.2,0.20595839023590087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,128,power_law_1.2,0.2110975980758667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,16,balanced,0.27004800240198773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,16,balanced,0.27025065819422406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,16,power_law_1.01,0.28538239002227783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,16,power_law_1.01,0.288703989982605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,16,power_law_1.2,0.297158408164978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,16,power_law_1.2,0.30035200119018557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,2,balanced,0.8284906546274821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,2,balanced,0.8308586279551188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,2,power_law_1.01,0.8443648338317871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,2,power_law_1.01,0.8652992248535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,2,power_law_1.2,0.8772992134094239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,2,power_law_1.2,0.8995136260986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,256,balanced,0.18685332934061685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,256,balanced,0.18702399730682373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,256,power_law_1.01,0.19163520336151124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,256,power_law_1.01,0.19418879747390747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,256,power_law_1.2,0.2000960111618042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,256,power_law_1.2,0.201580810546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,32,balanced,0.22392533222834268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,32,balanced,0.22571200132369995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,32,power_law_1.01,0.24458880424499513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,32,power_law_1.01,0.246124792098999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,32,power_law_1.2,0.2518719911575317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,32,power_law_1.2,0.25248639583587645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,4,balanced,0.5154133240381876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,4,balanced,0.5157013336817423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,4,power_law_1.01,0.5369855880737304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,4,power_law_1.01,0.5438015937805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,4,power_law_1.2,0.549945592880249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,4,power_law_1.2,0.5551807880401611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,64,balanced,0.2032159964243571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,64,balanced,0.20347734292348227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,64,power_law_1.01,0.21650559902191163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,64,power_law_1.01,0.21848320960998535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,64,power_law_1.2,0.2222656011581421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,64,power_law_1.2,0.22525439262390137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,8,balanced,0.35067200660705566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,8,balanced,0.35096001625061035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,8,power_law_1.01,0.36663041114807127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,8,power_law_1.01,0.37182719707489015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,8,power_law_1.2,0.3842367887496948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,1,8,power_law_1.2,0.38664960861206055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,16,1,balanced,0.2520959973335266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,16,1,balanced,0.25255467494328815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,16,1,power_law_1.01,0.259769606590271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,16,1,power_law_1.01,0.2600383996963501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,16,1,power_law_1.2,0.2823744058609009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,16,1,power_law_1.2,0.28879361152648925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,2,1,balanced,0.8022613525390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,2,1,balanced,0.810869296391805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,2,1,power_law_1.01,0.8146559715270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,2,1,power_law_1.01,0.8158207893371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,2,1,power_law_1.2,0.8573823928833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,2,1,power_law_1.2,0.8706879615783691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,32,1,balanced,0.20424532890319824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,32,1,balanced,0.20427733659744263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,32,1,power_law_1.01,0.21161599159240724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,32,1,power_law_1.01,0.21203839778900146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,32,1,power_law_1.2,0.23244800567626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,32,1,power_law_1.2,0.2362879991531372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,4,1,balanced,0.48129598299662274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,4,1,balanced,0.4821973244349162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,4,1,power_law_1.01,0.48200321197509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,4,1,power_law_1.01,0.49059200286865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,4,1,power_law_1.2,0.509887981414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,4,1,power_law_1.2,0.5169536113739014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,8,1,balanced,0.3179519971211751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,8,1,balanced,0.31807466348012287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,8,1,power_law_1.01,0.32047998905181885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,8,1,power_law_1.01,0.3244607925415039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,8,1,power_law_1.2,0.3457855939865112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,3072,1536,8,256,8,1,power_law_1.2,0.3540031909942627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,1,balanced,1.3682719866434734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,1,balanced,1.377354621887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,1,power_law_1.01,1.5492032051086426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,1,power_law_1.01,1.5659263610839844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,1,power_law_1.2,1.561843204498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,1,power_law_1.2,1.5749247550964356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,2,balanced,0.8097226619720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,2,balanced,0.8141547044118246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,2,power_law_1.01,1.0140416145324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,2,power_law_1.01,1.1507967948913573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,2,power_law_1.2,1.06046724319458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,2,power_law_1.2,1.1207615852355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,4,balanced,0.4866986672083537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,4,balanced,0.4891200065612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,4,power_law_1.01,0.7715648174285888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,4,power_law_1.01,0.9129664421081543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,4,power_law_1.2,0.7924416065216064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,4,power_law_1.2,0.9040384292602539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,8,balanced,0.39163732528686523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,8,balanced,0.39361600081125897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,8,power_law_1.01,0.6588096141815185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,8,power_law_1.01,0.668390417098999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,8,power_law_1.2,0.6892799854278564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,1,8,power_law_1.2,0.7170623779296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,16,1,balanced,0.15124799807866415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,16,1,balanced,0.15197333693504333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,16,1,power_law_1.01,0.15943039655685426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,16,1,power_law_1.01,0.16325759887695312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,16,1,power_law_1.2,0.160588800907135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,16,1,power_law_1.2,0.16240639686584474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,2,1,balanced,0.7101706663767496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,2,1,balanced,0.7159573237101237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,2,1,power_law_1.01,0.7913663864135743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,2,1,power_law_1.01,0.8044608116149903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,2,1,power_law_1.2,0.7539904117584229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,2,1,power_law_1.2,0.7944960117340087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,32,1,balanced,0.10122133294741313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,32,1,balanced,0.1013759970664978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,32,1,power_law_1.01,0.10769920349121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,32,1,power_law_1.01,0.10802559852600098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,32,1,power_law_1.2,0.10774400234222412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,32,1,power_law_1.2,0.10903040170669556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,4,1,balanced,0.37404799461364746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,4,1,balanced,0.376362681388855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,4,1,power_law_1.01,0.4246208190917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,4,1,power_law_1.01,0.4253568172454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,4,1,power_law_1.2,0.42092161178588866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,4,1,power_law_1.2,0.42357120513916013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,8,1,balanced,0.22383999824523926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,8,1,balanced,0.2246346672375997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,8,1,power_law_1.01,0.2382080078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,8,1,power_law_1.01,0.23899519443511963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,8,1,power_law_1.2,0.23364479541778566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,14336,2,8,8,1,power_law_1.2,0.2403007984161377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,1,balanced,1.0408426920572917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,1,balanced,1.0480373700459797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,1,power_law_1.01,1.2555007934570312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,1,power_law_1.01,1.2617600440979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,1,power_law_1.2,1.2961600303649903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,1,power_law_1.2,1.3034111976623535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,128,balanced,0.19101866086324057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,128,balanced,0.1911840041478475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,128,power_law_1.01,0.2023103952407837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,128,power_law_1.01,0.20538880825042724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,128,power_law_1.2,0.21969280242919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,128,power_law_1.2,0.22386560440063477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,16,balanced,0.23005332549413046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,16,balanced,0.23145600159962973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,16,power_law_1.01,0.2732032060623169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,16,power_law_1.01,0.2917952060699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,16,power_law_1.2,0.28592638969421386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,16,power_law_1.2,0.2859328031539917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,2,balanced,0.6280426581700643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,2,balanced,0.6303946574529012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,2,power_law_1.01,0.7401023864746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,2,power_law_1.01,0.7441535949707031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,2,power_law_1.2,0.773638391494751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,2,power_law_1.2,0.7859392166137695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,32,balanced,0.20245333512624106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,32,balanced,0.20294400056203207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,32,power_law_1.01,0.23516159057617186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,32,power_law_1.01,0.24354560375213624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,32,power_law_1.2,0.2543872117996216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,32,power_law_1.2,0.2579904079437256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,4,balanced,0.39716267585754395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,4,balanced,0.39768532911936444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,4,power_law_1.01,0.48748159408569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,4,power_law_1.01,0.49066882133483886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,4,power_law_1.2,0.5041152000427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,4,power_law_1.2,0.5143807888031006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,64,balanced,0.19541333119074503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,64,balanced,0.1956053376197815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,64,power_law_1.01,0.21713919639587403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,64,power_law_1.01,0.2199552059173584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,64,power_law_1.2,0.231660795211792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,64,power_law_1.2,0.2339776039123535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,8,balanced,0.2900213400522868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,8,balanced,0.29037866989771527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,8,power_law_1.01,0.3410559892654419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,8,power_law_1.01,0.341759991645813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,8,power_law_1.2,0.34286720752716066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,1,8,power_law_1.2,0.3650559902191162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,16,1,balanced,0.21090133984883627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,16,1,balanced,0.2119040091832479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,16,1,power_law_1.01,0.2610879898071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,16,1,power_law_1.01,0.2620032072067261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,16,1,power_law_1.2,0.2650943994522095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,16,1,power_law_1.2,0.2655679941177368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,2,1,balanced,0.5770293474197388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,2,1,balanced,0.5780106782913208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,2,1,power_law_1.01,0.6435071945190429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,2,1,power_law_1.01,0.6468095779418945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,2,1,power_law_1.2,0.6586624145507812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,2,1,power_law_1.2,0.6686079978942872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,32,1,balanced,0.19091200828552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,32,1,balanced,0.19104532400767008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,32,1,power_law_1.01,0.21079039573669434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,32,1,power_law_1.01,0.21181440353393555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,32,1,power_law_1.2,0.2134335994720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,32,1,power_law_1.2,0.2137984037399292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,4,1,balanced,0.3617759943008423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,4,1,balanced,0.3652373154958089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,4,1,power_law_1.01,0.41971840858459475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,4,1,power_law_1.01,0.4222400188446045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,4,1,power_law_1.2,0.43571839332580564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,4,1,power_law_1.2,0.43692798614501954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,8,1,balanced,0.2697920004526774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,8,1,balanced,0.2728959918022156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,8,1,power_law_1.01,0.29205760955810545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,8,1,power_law_1.01,0.2947968006134033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,8,1,power_law_1.2,0.29989759922027587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,1536,8,128,8,1,power_law_1.2,0.3109888076782227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,1,balanced,6.9451948801676435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,1,balanced,7.007242838541667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,1,power_law_1.01,7.898802947998047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,1,power_law_1.01,7.953997039794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,1,power_law_1.2,8.254694366455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,1,power_law_1.2,8.43154525756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,128,balanced,0.6759946346282959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,128,balanced,0.6772426764170328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,128,power_law_1.01,0.72674560546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,128,power_law_1.01,0.7301631927490234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,128,power_law_1.2,0.7489535808563232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,128,power_law_1.2,0.7562816143035889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,16,balanced,1.0063040256500244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,16,balanced,1.0083573659261067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,16,power_law_1.01,1.1150400161743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,16,power_law_1.01,1.1275008201599122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,16,power_law_1.2,1.1632960319519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,16,power_law_1.2,1.1651904106140136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,2,balanced,3.8127733866373696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,2,balanced,3.8762451807657876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,2,power_law_1.01,4.191507339477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,2,power_law_1.01,4.27185287475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,2,power_law_1.2,4.374265670776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,2,power_law_1.2,4.507718276977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,256,balanced,0.65775465965271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,256,balanced,0.6597013473510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,256,power_law_1.01,0.6961919784545898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,256,power_law_1.01,0.6963007926940918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,256,power_law_1.2,0.7133823871612549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,256,power_law_1.2,0.713862419128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,32,balanced,0.8248426914215088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,32,balanced,0.8263893127441406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,32,power_law_1.01,0.8883456230163574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,32,power_law_1.01,0.8964735984802246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,32,power_law_1.2,0.9169599533081054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,32,power_law_1.2,0.9202048301696777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,4,balanced,2.1368959744771323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,4,balanced,2.149439970652262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,4,power_law_1.01,2.4342464447021483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,4,power_law_1.01,2.436972808837891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,4,power_law_1.2,2.4676095962524416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,4,power_law_1.2,2.5278335571289063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,64,balanced,0.7311519781748453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,64,balanced,0.7331146399180094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,64,power_law_1.01,0.789408016204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,64,power_law_1.01,0.7963071823120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,64,power_law_1.2,0.8022272109985351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,64,power_law_1.2,0.823481559753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,8,balanced,1.387722651163737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,8,balanced,1.3887146313985188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,8,power_law_1.01,1.5447551727294921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,8,power_law_1.01,1.553004837036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,8,power_law_1.2,1.599942398071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,1,8,power_law_1.2,1.6213504791259765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,16,1,balanced,1.7718453407287598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,16,1,balanced,1.7744213740030925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,16,1,power_law_1.01,2.0729791641235353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,16,1,power_law_1.01,2.07840633392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,16,1,power_law_1.2,2.1403583526611327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,16,1,power_law_1.2,2.1452096939086913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,2,1,balanced,3.204069455464681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,2,1,balanced,3.2356745402018228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,2,1,power_law_1.01,3.490304183959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,2,1,power_law_1.01,3.5131649017333983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,2,1,power_law_1.2,3.584806442260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,2,1,power_law_1.2,3.6410495758056642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,32,1,balanced,1.5010347366333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,32,1,balanced,1.5026559829711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,32,1,power_law_1.01,1.7912063598632812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,32,1,power_law_1.01,1.8054336547851562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,32,1,power_law_1.2,1.8686464309692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,32,1,power_law_1.2,1.8722240447998046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,4,1,balanced,4.035349210103353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,4,1,balanced,4.162981351216634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,4,1,power_law_1.01,3.681011199951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,4,1,power_law_1.01,3.7850433349609376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,4,1,power_law_1.2,3.762860870361328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,4,1,power_law_1.2,3.809273529052734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,8,1,balanced,1.1964800357818604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,8,1,balanced,1.2072479724884033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,8,1,power_law_1.01,1.3374527931213378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,8,1,power_law_1.01,1.3397631645202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,8,1,power_law_1.2,1.3824895858764648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,4096,2688,22,512,8,1,power_law_1.2,1.3837504386901855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,1,balanced,2.2443040211995444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,1,balanced,2.348309357961019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,1,power_law_1.01,2.486848068237305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,1,power_law_1.01,2.5033536911010743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,1,power_law_1.2,2.475948715209961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,1,power_law_1.2,2.5261503219604493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,2,balanced,1.182421366373698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,2,balanced,1.188383976618449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,2,power_law_1.01,1.604115104675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,2,power_law_1.01,1.6929855346679688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,2,power_law_1.2,1.6223487854003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,2,power_law_1.2,1.6528959274291992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,4,balanced,0.681978702545166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,4,balanced,0.6847093105316162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,4,power_law_1.01,1.267520046234131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,4,power_law_1.01,1.2797439575195313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,4,power_law_1.2,1.2435199737548828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,4,power_law_1.2,1.3473919868469237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,8,balanced,0.4979786475499471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,8,balanced,0.49928001562754315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,8,power_law_1.01,0.990995216369629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,8,power_law_1.01,1.0462528228759767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,8,power_law_1.2,1.0064255714416503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,1,8,power_law_1.2,1.0388223648071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,16,1,balanced,0.21777600049972534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,16,1,balanced,0.21837333838144937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,16,1,power_law_1.01,0.2253887891769409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,16,1,power_law_1.01,0.23175039291381835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,16,1,power_law_1.2,0.2286207914352417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,16,1,power_law_1.2,0.23029758930206298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,2,1,balanced,1.137712001800537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,2,1,balanced,1.140559991200765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,2,1,power_law_1.01,1.2575039863586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,2,1,power_law_1.01,1.2761856079101563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,2,1,power_law_1.2,1.2491904258728028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,2,1,power_law_1.2,1.2537856101989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,32,1,balanced,0.14141333103179932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,32,1,balanced,0.14215466380119324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,32,1,power_law_1.01,0.149126398563385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,32,1,power_law_1.01,0.15067520141601562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,32,1,power_law_1.2,0.14913920164108277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,32,1,power_law_1.2,0.1494271993637085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,4,1,balanced,0.6016266743342081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,4,1,balanced,0.615066647529602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,4,1,power_law_1.01,0.6629951953887939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,4,1,power_law_1.01,0.6677824020385742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,4,1,power_law_1.2,0.6588799953460693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,4,1,power_law_1.2,0.6718912124633789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,8,1,balanced,0.3240799903869629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,8,1,balanced,0.3281866709391276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,8,1,power_law_1.01,0.3637439966201782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,8,1,power_law_1.01,0.37718400955200193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,8,1,power_law_1.2,0.36062719821929934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,16384,2,8,8,1,power_law_1.2,0.37355520725250246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,1,balanced,3.8584534327189126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,1,balanced,3.9280319213867188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,1,power_law_1.01,3.83109130859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,1,power_law_1.01,3.9774913787841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,1,power_law_1.2,4.087859344482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,1,power_law_1.2,4.195353698730469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,128,balanced,0.31647467613220215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,128,balanced,0.3166346748669942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,128,power_law_1.01,0.33870720863342285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,128,power_law_1.01,0.33968000411987304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,128,power_law_1.2,0.3558464050292969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,128,power_law_1.2,0.35916800498962403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,16,balanced,0.5003733237584432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,16,balanced,0.5017013152440389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,16,power_law_1.01,0.5356351852416992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,16,power_law_1.01,0.5504320144653321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,16,power_law_1.2,0.5532608032226562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,16,power_law_1.2,0.5661119937896728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,2,balanced,2.03438393274943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,2,balanced,2.0593813260396323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,2,power_law_1.01,2.072147178649902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,2,power_law_1.01,2.079654312133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,2,power_law_1.2,2.1645503997802735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,2,power_law_1.2,2.2725503921508787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,256,balanced,0.3078933358192444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,256,balanced,0.30877333879470825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,256,power_law_1.01,0.3227839946746826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,256,power_law_1.01,0.3247551918029785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,256,power_law_1.2,0.3352895975112915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,256,power_law_1.2,0.34133119583129884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,32,balanced,0.39580798149108887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,32,balanced,0.3969279925028483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,32,power_law_1.01,0.42865920066833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,32,power_law_1.01,0.43279361724853516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,32,power_law_1.2,0.44815998077392577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,32,power_law_1.2,0.45674881935119627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,4,balanced,1.1315733591715496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,4,balanced,1.141434669494629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,4,power_law_1.01,1.1765119552612304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,4,power_law_1.01,1.20831356048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,4,power_law_1.2,1.2272768020629883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,4,power_law_1.2,1.258176040649414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,64,balanced,0.3366080125172933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,64,balanced,0.3380053440729777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,64,power_law_1.01,0.37121920585632323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,64,power_law_1.01,0.37242879867553713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,64,power_law_1.2,0.3851327896118164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,64,power_law_1.2,0.3949376106262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,8,balanced,0.7103412946065267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,8,balanced,0.7124213377634684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,8,power_law_1.01,0.7521664142608643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,8,power_law_1.01,0.7578879833221436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,8,power_law_1.2,0.7757887840270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,1,8,power_law_1.2,0.7800576210021972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,16,1,balanced,0.47550400098164874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,16,1,balanced,0.47623999913533527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,16,1,power_law_1.01,0.4833536148071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,16,1,power_law_1.01,0.4846975803375244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,16,1,power_law_1.2,0.5374656200408936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,16,1,power_law_1.2,0.5401663780212402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,2,1,balanced,1.923631985982259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,2,1,balanced,1.971274693806966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,2,1,power_law_1.01,1.9718463897705079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,2,1,power_law_1.01,1.9931520462036132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,2,1,power_law_1.2,2.048928070068359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,2,1,power_law_1.2,2.1091903686523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,32,1,balanced,0.3752053181330363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,32,1,balanced,0.37699735164642334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,32,1,power_law_1.01,0.38978559970855714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,32,1,power_law_1.01,0.39907839298248293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,32,1,power_law_1.2,0.4397439956665039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,32,1,power_law_1.2,0.4398208141326904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,4,1,balanced,1.076464017232259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,4,1,balanced,1.0837706724802654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,4,1,power_law_1.01,1.1038592338562012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,4,1,power_law_1.01,1.1108160018920898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,4,1,power_law_1.2,1.1674495697021485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,4,1,power_law_1.2,1.1704256057739257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,8,1,balanced,0.6823200384775797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,8,1,balanced,0.6847946643829346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,8,1,power_law_1.01,0.6907328128814697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,8,1,power_law_1.01,0.6985280036926269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,8,1,power_law_1.2,0.7350656032562256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2048,8,256,8,1,power_law_1.2,0.7487040042877198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,1,balanced,3.0246880849202475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,1,balanced,3.0821119944254556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,1,power_law_1.01,3.624505615234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,1,power_law_1.01,3.6408382415771485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,1,power_law_1.2,3.692063903808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,1,power_law_1.2,3.7204097747802733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,16,balanced,0.4365333318710327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,16,balanced,0.43676801522572833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,16,power_law_1.01,0.5268991947174072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,16,power_law_1.01,0.5418432235717774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,16,power_law_1.2,0.5529856204986572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,16,power_law_1.2,0.5537216186523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,2,balanced,1.6251145998636882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,2,balanced,1.6492640177408855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,2,power_law_1.01,1.8832319259643555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,2,power_law_1.01,1.9551359176635743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,2,power_law_1.2,1.973593521118164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,2,power_law_1.2,2.0177919387817385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,32,balanced,0.3494186798731486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,32,balanced,0.35126932462056476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,32,power_law_1.01,0.42028160095214845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,32,power_law_1.01,0.42583680152893066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,32,power_law_1.2,0.4595776081085205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,32,power_law_1.2,0.46077442169189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,4,balanced,0.9345013300577799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,4,balanced,0.9363839626312256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,4,power_law_1.01,1.109267234802246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,4,power_law_1.01,1.1301504135131837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,4,power_law_1.2,1.1688575744628906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,4,power_law_1.2,1.1810943603515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,8,balanced,0.603333314259847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,8,balanced,0.6049600044886271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,8,power_law_1.01,0.7195583820343018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,8,power_law_1.01,0.731705617904663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,8,power_law_1.2,0.7830143928527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,1,8,power_law_1.2,0.804748821258545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,16,1,balanced,0.4010239839553833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,16,1,balanced,0.4022773504257202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,16,1,power_law_1.01,0.47624959945678713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,16,1,power_law_1.01,0.48115200996398927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,16,1,power_law_1.2,0.48107519149780276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,16,1,power_law_1.2,0.4827583789825439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,2,1,balanced,1.5719146728515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,2,1,balanced,1.6138346989949544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,2,1,power_law_1.01,1.8031744003295898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,2,1,power_law_1.01,1.818355178833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,2,1,power_law_1.2,1.852774429321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,2,1,power_law_1.2,1.8735872268676759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,32,1,balanced,0.36181334654490155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,32,1,balanced,0.3618239959081014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,32,1,power_law_1.01,0.39317760467529295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,32,1,power_law_1.01,0.39565439224243165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,32,1,power_law_1.2,0.39797120094299315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,32,1,power_law_1.2,0.3989504098892212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,4,1,balanced,0.889631986618042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,4,1,balanced,0.8985653718312582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,4,1,power_law_1.01,1.020742416381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,4,1,power_law_1.01,1.0208448410034179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,4,1,power_law_1.2,1.0398847579956054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,4,1,power_law_1.2,1.0410816192626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,8,1,balanced,0.5401120185852051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,8,1,balanced,0.5410986741383871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,8,1,power_law_1.01,0.6199935913085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,8,1,power_law_1.01,0.6238719940185546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,8,1,power_law_1.2,0.6281216144561768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,6144,2560,8,160,8,1,power_law_1.2,0.6300864219665527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,1,balanced,4.41702938079834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,1,balanced,4.461866696675618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,1,power_law_1.01,4.527833557128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,1,power_law_1.01,4.585177612304688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,1,power_law_1.2,4.734905624389649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,1,power_law_1.2,4.942086410522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,128,balanced,0.34616533915201825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,128,balanced,0.3466506799062093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,128,power_law_1.01,0.37925760746002196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,128,power_law_1.01,0.3808511972427368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,128,power_law_1.2,0.390118408203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,128,power_law_1.2,0.3952640056610107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,16,balanced,0.5654720067977905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,16,balanced,0.5661919911702474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,16,power_law_1.01,0.6014912128448486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,16,power_law_1.01,0.6020031929016113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,16,power_law_1.2,0.6298495769500733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,16,power_law_1.2,0.6322559833526611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,2,balanced,2.43013858795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,2,balanced,2.4441653887430825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,2,power_law_1.01,2.4675199508666994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,2,power_law_1.01,2.512633514404297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,2,power_law_1.2,2.439455986022949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,2,power_law_1.2,2.5474111557006838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,256,balanced,0.33628801504770917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,256,balanced,0.33872000376383465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,256,power_law_1.01,0.3536704063415527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,256,power_law_1.01,0.35576319694519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,256,power_law_1.2,0.3714303970336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,256,power_law_1.2,0.3753024101257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,32,balanced,0.44066667556762695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,32,balanced,0.4407840172449748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,32,power_law_1.01,0.47424001693725587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,32,power_law_1.01,0.47426562309265136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,32,power_law_1.2,0.5016320228576661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,32,power_law_1.2,0.5031680107116699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,4,balanced,1.3079893589019775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,4,balanced,1.309221347173055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,4,power_law_1.01,1.3577664375305176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,4,power_law_1.01,1.3936448097229004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,4,power_law_1.2,1.4244159698486327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,4,power_law_1.2,1.4545472145080567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,64,balanced,0.3717706600824992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,64,balanced,0.37349867820739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,64,power_law_1.01,0.40843520164489744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,64,power_law_1.01,0.41800317764282224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,64,power_law_1.2,0.4286719799041748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,64,power_law_1.2,0.43381757736206056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,8,balanced,0.8085599740346273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,8,balanced,0.8107519944508871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,8,power_law_1.01,0.8592255592346192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,8,power_law_1.01,0.8710207939147949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,8,power_law_1.2,0.9114751815795898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,1,8,power_law_1.2,0.9118783950805665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,16,1,balanced,0.5489120086034139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,16,1,balanced,0.5497226715087891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,16,1,power_law_1.01,0.5607359886169434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,16,1,power_law_1.01,0.567199993133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,16,1,power_law_1.2,0.6173247814178466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,16,1,power_law_1.2,0.6246399879455566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,2,1,balanced,2.2280799547831216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,2,1,balanced,2.3799306551615396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,2,1,power_law_1.01,2.2957759857177735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,2,1,power_law_1.01,2.335206413269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,2,1,power_law_1.2,2.419820785522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,2,1,power_law_1.2,2.4640064239501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,32,1,balanced,0.4299733241399129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,32,1,balanced,0.4312693277994792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,32,1,power_law_1.01,0.4440000057220459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,32,1,power_law_1.01,0.44415998458862305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,32,1,power_law_1.2,0.49752321243286135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,32,1,power_law_1.2,0.5058559894561767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,4,1,balanced,1.2421813011169434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,4,1,balanced,1.2772106329600017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,4,1,power_law_1.01,1.2810879707336427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,4,1,power_law_1.01,1.2925888061523438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,4,1,power_law_1.2,1.3502400398254395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,4,1,power_law_1.2,1.3527551651000977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,8,1,balanced,0.7915573120117188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,8,1,balanced,0.7932799657185873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,8,1,power_law_1.01,0.8003264427185058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,8,1,power_law_1.01,0.8045951843261718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,8,1,power_law_1.2,0.8689599990844726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,256,8,1,power_law_1.2,0.8726847648620606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,1,balanced,6.395088195800781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,1,balanced,6.783349355061849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,1,power_law_1.01,6.197356796264648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,1,power_law_1.01,6.20173454284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,1,power_law_1.2,6.473152160644531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,1,power_law_1.2,6.738393402099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,128,balanced,0.41649067401885986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,128,balanced,0.41737067699432373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,128,power_law_1.01,0.43108482360839845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,128,power_law_1.01,0.4384448051452637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,128,power_law_1.2,0.4488704204559326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,128,power_law_1.2,0.45469441413879397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,16,balanced,0.7394933700561523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,16,balanced,0.7403733730316162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,16,power_law_1.01,0.7389120101928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,16,power_law_1.01,0.7412032127380371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,16,power_law_1.2,0.7726463794708252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,16,power_law_1.2,0.7861824035644531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,2,balanced,3.4595413208007812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,2,balanced,3.6513760884602866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,2,power_law_1.01,3.1777088165283205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,2,power_law_1.01,3.2829822540283202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,2,power_law_1.2,3.375584030151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,2,power_law_1.2,3.397747039794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,32,balanced,0.5638026793797811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,32,balanced,0.565882682800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,32,power_law_1.01,0.5675968170166016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,32,power_law_1.01,0.5821311950683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,32,power_law_1.2,0.5810944080352783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,32,power_law_1.2,0.5831488132476806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,4,balanced,1.8360479672749836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,4,balanced,1.8840586344401042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,4,power_law_1.01,1.737548828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,4,power_law_1.01,1.7952192306518555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,4,power_law_1.2,1.8263616561889648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,4,power_law_1.2,1.8342144012451171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,64,balanced,0.4620906511942546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,64,balanced,0.4634773333867391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,64,power_law_1.01,0.48024959564208985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,64,power_law_1.01,0.4857920169830322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,64,power_law_1.2,0.497376012802124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,64,power_law_1.2,0.509984016418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,8,balanced,1.1129546960194905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,8,balanced,1.1159466902414958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,8,power_law_1.01,1.063315200805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,8,power_law_1.01,1.0919360160827636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,8,power_law_1.2,1.1381440162658691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,1,8,power_law_1.2,1.1512384414672852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,16,1,balanced,0.7569066683451334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,16,1,balanced,0.758944034576416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,16,1,power_law_1.01,0.7337664127349853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,16,1,power_law_1.01,0.7379648208618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,16,1,power_law_1.2,0.7522624015808106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,16,1,power_law_1.2,0.7546432018280029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,2,1,balanced,3.401151974995931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,2,1,balanced,3.402186711629232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,2,1,power_law_1.01,3.0964927673339844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,2,1,power_law_1.01,3.136358451843262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,2,1,power_law_1.2,3.2234943389892576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,2,1,power_law_1.2,3.2374526977539064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,32,1,balanced,0.6094933350880941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,32,1,balanced,0.6111840009689331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,32,1,power_law_1.01,0.595577621459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,32,1,power_law_1.01,0.5992063999176025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,32,1,power_law_1.2,0.6077568054199218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,32,1,power_law_1.2,0.6108223915100097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,4,1,balanced,1.8033119837443035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,4,1,balanced,1.836725393931071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,4,1,power_law_1.01,1.6936384201049806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,4,1,power_law_1.01,1.7156095504760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,4,1,power_law_1.2,1.7690624237060546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,4,1,power_law_1.2,1.7804288864135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,8,1,balanced,1.1218773523966472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,8,1,balanced,1.1229013601938884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,8,1,power_law_1.01,1.0506943702697753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,8,1,power_law_1.01,1.0732992172241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,8,1,power_law_1.2,1.1025792121887208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,1536,7168,2048,8,384,8,1,power_law_1.2,1.1075263977050782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,1,balanced,0.20462934176127115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,1,balanced,0.2061013380686442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,1,power_law_1.01,0.11578240394592285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,1,power_law_1.01,0.1209663987159729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,1,power_law_1.2,0.11045119762420655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,1,power_law_1.2,0.11077760457992554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,128,balanced,0.02828266719977061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,128,balanced,0.029520000020662945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,128,power_law_1.01,0.02709760069847107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,128,power_law_1.01,0.02768000066280365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,128,power_law_1.2,0.026956799626350402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,128,power_law_1.2,0.02712959945201874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,16,balanced,0.035274667044480644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,16,balanced,0.03566933423280716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,16,power_law_1.01,0.03227519989013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,16,power_law_1.01,0.03373439908027649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,16,power_law_1.2,0.032262399792671204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,16,power_law_1.2,0.03293440043926239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,2,balanced,0.12362666924794515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,2,balanced,0.13421866297721863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,2,power_law_1.01,0.08085759878158569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,2,power_law_1.01,0.08150399923324585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,2,power_law_1.2,0.07459200024604798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,2,power_law_1.2,0.07612800002098083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,32,balanced,0.03124266614516576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,32,balanced,0.0314026673634847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,32,power_law_1.01,0.028255999088287354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,32,power_law_1.01,0.02879360020160675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,32,power_law_1.2,0.028172799944877626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,32,power_law_1.2,0.028384000062942505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,4,balanced,0.07841599980990092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,4,balanced,0.07867733140786488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,4,power_law_1.01,0.05427200198173523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,4,power_law_1.01,0.05775359869003296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,4,power_law_1.2,0.059334397315979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,4,power_law_1.2,0.06177279949188232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,64,balanced,0.029258665939172108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,64,balanced,0.029306667546431225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,64,power_law_1.01,0.027539199590682982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,64,power_law_1.01,0.027852800488471986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,64,power_law_1.2,0.02775680124759674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,64,power_law_1.2,0.028012800216674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,8,balanced,0.0535093347231547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,8,balanced,0.053717335065205894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,8,power_law_1.01,0.041222399473190306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,8,power_law_1.01,0.04508799910545349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,8,power_law_1.2,0.04318720102310181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,1,8,power_law_1.2,0.04460160136222839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,2,1,balanced,0.13052266836166382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,2,1,balanced,0.1318826675415039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,2,1,power_law_1.01,0.07856640219688416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,2,1,power_law_1.01,0.07953280210494995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,2,1,power_law_1.2,0.0741312026977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,2,1,power_law_1.2,0.07564160227775574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,4,1,balanced,0.09178133805592854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,4,1,balanced,0.09232532978057861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,4,1,power_law_1.01,0.05724800229072571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,4,1,power_law_1.01,0.05788159966468811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,4,1,power_law_1.2,0.05542399883270264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2048,768,8,128,4,1,power_law_1.2,0.05610880255699158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,1,balanced,0.4326026837031047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,1,balanced,0.43486932913462323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,1,power_law_1.01,0.2811968088150024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,1,power_law_1.01,0.2903615951538086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,1,power_law_1.2,0.2617343902587891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,1,power_law_1.2,0.2743936061859131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,128,balanced,0.03326933334271113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,128,balanced,0.03341866781314214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,128,power_law_1.01,0.032076799869537355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,128,power_law_1.01,0.032313600182533264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,128,power_law_1.2,0.03283199965953827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,128,power_law_1.2,0.03309440016746521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,16,balanced,0.05712000032265981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,16,balanced,0.05788800120353699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,16,power_law_1.01,0.05160319805145264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,16,power_law_1.01,0.05624960064888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,16,power_law_1.2,0.05642240047454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,16,power_law_1.2,0.06108800172805786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,2,balanced,0.2387146751085917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,2,balanced,0.24240533510843912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,2,power_law_1.01,0.17326079607009887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,2,power_law_1.01,0.18375680446624756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,2,power_law_1.2,0.14714239835739135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,2,power_law_1.2,0.1770624041557312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,32,balanced,0.04162133236726125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,32,balanced,0.04179200033346812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,32,power_law_1.01,0.04258559942245484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,32,power_law_1.01,0.04467839896678925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,32,power_law_1.2,0.041875201463699344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,32,power_law_1.2,0.04273279905319214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,4,balanced,0.14681599537531534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,4,balanced,0.14728533228238425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,4,power_law_1.01,0.11029759645462037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,4,power_law_1.01,0.11452800035476685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,4,power_law_1.2,0.10929919481277466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,4,power_law_1.2,0.11262719631195069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,64,balanced,0.03746666759252548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,64,balanced,0.03750933210055033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,64,power_law_1.01,0.03620480000972748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,64,power_law_1.01,0.036735999584198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,64,power_law_1.2,0.03563520014286041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,64,power_law_1.2,0.03617919981479645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,8,balanced,0.09133866429328918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,8,balanced,0.0921493371327718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,8,power_law_1.01,0.08289920091629029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,8,power_law_1.01,0.09066240191459655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,8,power_law_1.2,0.08060160279273987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,1,8,power_law_1.2,0.08896639943122864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,16,1,balanced,0.1693120002746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,16,1,balanced,0.1697546641031901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,16,1,power_law_1.01,0.1120959997177124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,16,1,power_law_1.01,0.11509759426116943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,16,1,power_law_1.2,0.10372480154037475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,16,1,power_law_1.2,0.10677759647369385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,2,1,balanced,0.24300267299016318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,2,1,balanced,0.24505066871643066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,2,1,power_law_1.01,0.1637503981590271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,2,1,power_law_1.01,0.16437760591506959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,2,1,power_law_1.2,0.15578880310058593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,32,1,balanced,0.15598932902018228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,32,1,balanced,0.1562879979610443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,32,1,power_law_1.01,0.10116480588912964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,32,1,power_law_1.01,0.10393600463867188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,32,1,power_law_1.2,0.09436799883842469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,32,1,power_law_1.2,0.09784319996833801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,4,1,balanced,0.15272000432014465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,4,1,balanced,0.15519466996192932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,4,1,power_law_1.01,0.10164480209350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,4,1,power_law_1.01,0.10584959983825684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,4,1,power_law_1.2,0.09219200015068055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,4,1,power_law_1.2,0.09425920248031616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,8,1,balanced,0.21361599365870157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,8,1,balanced,0.2143146594365438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,8,1,power_law_1.01,0.1417407989501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,8,1,power_law_1.01,0.14362879991531372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,8,1,power_law_1.2,0.12463359832763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,2688,1856,6,128,8,1,power_law_1.2,0.13011200428009034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,1,balanced,0.5419840017954508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,1,balanced,0.543994665145874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,1,power_law_1.01,0.4153088092803955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,1,power_law_1.01,0.4254784107208252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,1,power_law_1.2,0.36878080368041993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,1,power_law_1.2,0.37792000770568845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,128,balanced,0.033439998825391136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,128,balanced,0.033514666060606636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,128,power_law_1.01,0.034041601419448855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,128,power_law_1.01,0.034483200311660765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,128,power_law_1.2,0.033670398592948916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,128,power_law_1.2,0.03446399867534637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,16,balanced,0.06544533371925354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,16,balanced,0.06635199983914693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,16,power_law_1.01,0.09635199904441834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,16,power_law_1.01,0.09773439764976502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,16,power_law_1.2,0.09709439873695373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,16,power_law_1.2,0.09794560074806213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,2,balanced,0.2921760082244873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,2,balanced,0.29411200682322186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,2,power_law_1.01,0.2596927881240845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,2,power_law_1.01,0.2720896005630493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,2,power_law_1.2,0.2378432035446167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,2,power_law_1.2,0.23821439743041992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,256,balanced,0.033626665671666466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,256,balanced,0.03523733218510946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,256,power_law_1.01,0.032358399033546446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,256,power_law_1.01,0.03283840119838714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,256,power_law_1.2,0.03281919956207276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,256,power_law_1.2,0.03348479866981506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,32,balanced,0.04589866598447164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,32,balanced,0.04775999983151754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,32,power_law_1.01,0.06179839968681335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,32,power_law_1.01,0.062009602785110474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,32,power_law_1.2,0.05694079995155334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,32,power_law_1.2,0.06053119897842407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,4,balanced,0.17730132738749185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,4,balanced,0.17810134092966715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,4,power_law_1.01,0.18001919984817505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,4,power_law_1.01,0.19695359468460083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,4,power_law_1.2,0.16939519643783568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,4,power_law_1.2,0.17953920364379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,64,balanced,0.035360001027584076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,64,balanced,0.035642666121323906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,64,power_law_1.01,0.04175359904766083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,64,power_law_1.01,0.0440447986125946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,64,power_law_1.2,0.04056319892406464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,64,power_law_1.2,0.044121599197387694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,8,balanced,0.1000373363494873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,8,balanced,0.10084799925486247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,8,power_law_1.01,0.15062400102615356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,8,power_law_1.01,0.1511615991592407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,8,power_law_1.2,0.1383679986000061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,1,8,power_law_1.2,0.14622080326080322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,16,1,balanced,0.09412266810735066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,16,1,balanced,0.09490666786829631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,16,1,power_law_1.01,0.07538560032844543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,16,1,power_law_1.01,0.07655680179595947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,16,1,power_law_1.2,0.0695039987564087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,16,1,power_law_1.2,0.07033600211143494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,2,1,balanced,0.2935520013173421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,2,1,balanced,0.30167466402053833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,2,1,power_law_1.01,0.22705280780792236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,2,1,power_law_1.01,0.23191680908203124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,2,1,power_law_1.2,0.20341761112213136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,2,1,power_law_1.2,0.20574719905853273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,32,1,balanced,0.08144000172615051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,32,1,balanced,0.08166933556397755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,32,1,power_law_1.01,0.0687936007976532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,32,1,power_law_1.01,0.06929919719696045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,32,1,power_law_1.2,0.06428800225257873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,32,1,power_law_1.2,0.06453760266304016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,4,1,balanced,0.1800373395284017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,4,1,balanced,0.18070934216181436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,4,1,power_law_1.01,0.14001920223236083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,4,1,power_law_1.2,0.13292160034179687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,4,1,power_law_1.2,0.135481595993042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,8,1,balanced,0.12591466307640076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,8,1,balanced,0.12618666887283325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,8,1,power_law_1.01,0.10548479557037353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,8,1,power_law_1.01,0.10680960416793824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,8,1,power_law_1.2,0.09704319834709167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,3072,1536,8,256,8,1,power_law_1.2,0.09920639991760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,1,balanced,0.478767991065979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,1,balanced,0.4816319942474365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,1,power_law_1.01,0.45352959632873535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,1,power_law_1.01,0.478879976272583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,1,power_law_1.2,0.4765439987182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,1,power_law_1.2,0.48577280044555665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,2,balanced,0.2491733431816101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,2,balanced,0.24994667371114096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,2,power_law_1.01,0.2457792043685913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,2,power_law_1.01,0.25063679218292234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,2,power_law_1.2,0.22732160091400147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,2,power_law_1.2,0.2462847948074341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,4,balanced,0.16427733500798544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,4,balanced,0.170741339524587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,4,power_law_1.01,0.15886720418930053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,4,power_law_1.01,0.15970560312271118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,4,power_law_1.2,0.15808639526367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,4,power_law_1.2,0.1601408004760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,8,balanced,0.11219200491905212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,8,balanced,0.11563733220100403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,8,power_law_1.01,0.10917760133743286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,8,power_law_1.01,0.1106112003326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,8,power_law_1.2,0.10928640365600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,1,8,power_law_1.2,0.11302399635314941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,16,1,balanced,0.05593066910902659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,16,1,balanced,0.05606933434804281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,16,1,power_law_1.01,0.05287039875984192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,16,1,power_law_1.01,0.05295360088348389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,16,1,power_law_1.2,0.05116159915924072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,16,1,power_law_1.2,0.053388798236846925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,2,1,balanced,0.25471999247868854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,2,1,balanced,0.2563040057818095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,2,1,power_law_1.01,0.241593599319458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,2,1,power_law_1.01,0.2510463953018188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,2,1,power_law_1.2,0.24855680465698243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,2,1,power_law_1.2,0.26458239555358887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,32,1,balanced,0.0352906659245491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,32,1,balanced,0.03801066676775614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,32,1,power_law_1.01,0.034822401404380796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,32,1,power_law_1.01,0.03553920090198517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,32,1,power_law_1.2,0.03537920117378235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,32,1,power_law_1.2,0.03575679957866669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,4,1,balanced,0.14723733067512512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,4,1,balanced,0.16146666804949442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,4,1,power_law_1.01,0.13948160409927368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,4,1,power_law_1.01,0.14368640184402465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,4,1,power_law_1.2,0.13871359825134277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,4,1,power_law_1.2,0.14214400053024293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,8,1,balanced,0.09696533282597859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,8,1,balanced,0.09790933132171631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,8,1,power_law_1.01,0.08551040291786194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,8,1,power_law_1.01,0.08615679740905761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,8,1,power_law_1.2,0.08233600258827209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,14336,2,8,8,1,power_law_1.2,0.0870464026927948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,1,balanced,0.715674638748169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,1,balanced,0.7163840134938558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,1,power_law_1.01,0.37575678825378417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,1,power_law_1.01,0.3844095945358276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,1,power_law_1.2,0.35595519542694093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,1,power_law_1.2,0.3569855928421021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,128,balanced,0.0393653338154157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,128,balanced,0.03945599993069967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,128,power_law_1.01,0.037062400579452516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,128,power_law_1.01,0.037452799081802365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,128,power_law_1.2,0.037196800112724304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,128,power_law_1.2,0.037529599666595456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,16,balanced,0.08064533273379008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,16,balanced,0.0806933343410492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,16,power_law_1.01,0.06771199703216553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,16,power_law_1.01,0.07100160121917724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,16,power_law_1.2,0.06053760051727295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,16,power_law_1.2,0.06470400094985962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,2,balanced,0.37910401821136475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,2,balanced,0.37990931669871014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,2,power_law_1.01,0.23784959316253662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,2,power_law_1.01,0.2396159887313843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,2,power_law_1.2,0.20235519409179686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,2,power_law_1.2,0.21332480907440185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,32,balanced,0.056015998125076294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,32,balanced,0.05610666672388712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,32,power_law_1.01,0.04829440116882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,32,power_law_1.01,0.05065600275993347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,32,power_law_1.2,0.04696959853172302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,32,power_law_1.2,0.052153599262237546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,4,balanced,0.21181867520014444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,4,balanced,0.21209067106246948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,4,power_law_1.01,0.1278656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,4,power_law_1.01,0.1437440037727356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,4,power_law_1.2,0.131494402885437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,4,power_law_1.2,0.1446272015571594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,64,balanced,0.04165333261092504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,64,balanced,0.0417546679576238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,64,power_law_1.01,0.03939839899539947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,64,power_law_1.01,0.040454399585723874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,64,power_law_1.2,0.03895680010318756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,64,power_law_1.2,0.039724799990653994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,8,balanced,0.12345600128173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,8,balanced,0.12758400042851767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,8,power_law_1.01,0.09649919867515563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,8,power_law_1.01,0.10366719961166382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,8,power_law_1.2,0.09366400241851806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,1,8,power_law_1.2,0.11515519618988038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,16,1,balanced,0.11757866541544597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,16,1,balanced,0.11774933338165283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,16,1,power_law_1.01,0.07388160228729249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,16,1,power_law_1.01,0.07433599829673768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,16,1,power_law_1.2,0.0697983980178833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,16,1,power_law_1.2,0.07089279890060425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,2,1,balanced,0.37610665957132977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,2,1,balanced,0.3835893472035726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,2,1,power_law_1.01,0.2153856039047241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,2,1,power_law_1.01,0.22266879081726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,2,1,power_law_1.2,0.19705599546432495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,2,1,power_law_1.2,0.19769599437713622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,32,1,balanced,0.10356799761454265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,32,1,balanced,0.1039680043856303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,32,1,power_law_1.01,0.0656000018119812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,32,1,power_law_1.01,0.066348797082901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,32,1,power_law_1.2,0.062080001831054686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,32,1,power_law_1.2,0.0634112000465393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,4,1,balanced,0.22846933205922446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,4,1,balanced,0.23051732778549194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,4,1,power_law_1.01,0.12983039617538453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,4,1,power_law_1.01,0.13156479597091675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,4,1,power_law_1.2,0.1230463981628418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,4,1,power_law_1.2,0.12403199672698975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,8,1,balanced,0.15820800264676413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,8,1,balanced,0.16025066375732422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,8,1,power_law_1.01,0.09311360120773315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,8,1,power_law_1.01,0.09709439873695373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,8,1,power_law_1.2,0.08675839900970458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,1536,8,128,8,1,power_law_1.2,0.08824319839477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,1,balanced,3.261418660481771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,1,balanced,3.2676852544148765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,1,power_law_1.01,2.115385627746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,1,power_law_1.01,2.152748870849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,1,power_law_1.2,1.8524288177490233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,1,power_law_1.2,1.9097087860107422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,128,balanced,0.10505066315333049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,128,balanced,0.10552000006039937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,128,power_law_1.01,0.09085440039634704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,128,power_law_1.01,0.10078719854354859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,128,power_law_1.2,0.09557759761810303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,128,power_law_1.2,0.10039039850234985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,16,balanced,0.32602133353551227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,16,balanced,0.32630934317906696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,16,power_law_1.01,0.36129279136657716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,16,power_law_1.01,0.37016959190368653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,16,power_law_1.2,0.36738560199737547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,16,power_law_1.2,0.3679744005203247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,2,balanced,1.683882713317871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,2,balanced,1.6961280504862468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,2,power_law_1.01,1.1628607749938964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,2,power_law_1.01,1.2247679710388184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,2,power_law_1.2,1.148153591156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,2,power_law_1.2,1.1492927551269532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,256,balanced,0.08263466755549113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,256,balanced,0.08319466809431712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,256,power_law_1.01,0.08081279993057251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,256,power_law_1.01,0.08083199858665466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,256,power_law_1.2,0.0807807981967926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,256,power_law_1.2,0.08190720081329346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,32,balanced,0.2232960065205892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,32,balanced,0.22593067089716592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,32,power_law_1.01,0.21434879302978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,32,power_law_1.01,0.21505279541015626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,32,power_law_1.2,0.19735679626464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,32,power_law_1.2,0.20607359409332277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,4,balanced,0.9075199762980143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,4,balanced,0.9135786692301432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,4,power_law_1.01,0.7543871879577637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,4,power_law_1.01,0.7869952201843262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,4,power_law_1.2,0.7127295970916748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,4,power_law_1.2,0.7418879985809326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,64,balanced,0.1459946632385254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,64,balanced,0.1461013356844584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,64,power_law_1.01,0.13034240007400513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,64,power_law_1.01,0.130457603931427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,64,power_law_1.2,0.1317952036857605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,64,power_law_1.2,0.14199680089950562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,8,balanced,0.5145226716995239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,8,balanced,0.5196160078048706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,8,power_law_1.01,0.5509696006774902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,8,power_law_1.01,0.6099775791168213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,8,power_law_1.2,0.5679488182067871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,1,8,power_law_1.2,0.5685503959655762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,16,1,balanced,0.9744266668955485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,16,1,balanced,0.9747680028279623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,16,1,power_law_1.01,0.6301695823669433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,16,1,power_law_1.01,0.651801586151123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,16,1,power_law_1.2,0.5815552234649658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,16,1,power_law_1.2,0.591264009475708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,2,1,balanced,1.6348533630371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,2,1,balanced,1.643631935119629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,2,1,power_law_1.01,1.0789631843566894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,2,1,power_law_1.01,1.0949312210083009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,2,1,power_law_1.2,0.9575167655944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,2,1,power_law_1.2,0.9948224067687989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,32,1,balanced,0.8101973533630371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,32,1,balanced,0.813162644704183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,32,1,power_law_1.01,0.5242815971374511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,32,1,power_law_1.01,0.541811180114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,32,1,power_law_1.2,0.4956992149353027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,32,1,power_law_1.2,0.49683198928833006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,4,1,balanced,0.9449866612752279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,4,1,balanced,0.9452106952667236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,4,1,power_law_1.01,0.6342976093292236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,4,1,power_law_1.01,0.6359424114227294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,4,1,power_law_1.2,0.5737279891967774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,4,1,power_law_1.2,0.5744703769683838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,8,1,balanced,0.5493919849395752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,8,1,balanced,0.5508053302764893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,8,1,power_law_1.01,0.3666815996170044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,8,1,power_law_1.01,0.37368319034576414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,8,1,power_law_1.2,0.33714559078216555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,4096,2688,22,512,8,1,power_law_1.2,0.34277119636535647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,1,balanced,0.7171200116475424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,1,balanced,0.7177066802978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,1,power_law_1.01,0.7211584091186524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,1,power_law_1.01,0.7293695926666259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,1,power_law_1.2,0.6850368022918701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,1,power_law_1.2,0.7047679901123047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,2,balanced,0.3797706762949626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,2,balanced,0.39979732036590576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,2,power_law_1.01,0.3759040117263794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,2,power_law_1.01,0.376857590675354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,2,power_law_1.2,0.37804160118103025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,2,power_law_1.2,0.3791743993759155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,4,balanced,0.22363199790318808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,4,balanced,0.22739734252293906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,4,power_law_1.01,0.22275838851928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,4,power_law_1.01,0.22362239360809327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,4,power_law_1.2,0.22762880325317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,4,power_law_1.2,0.23050239086151122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,8,balanced,0.1527413328488668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,8,balanced,0.15520000457763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,8,power_law_1.01,0.1505087971687317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,8,power_law_1.01,0.15203839540481567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,8,power_law_1.2,0.15111039876937865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,1,8,power_law_1.2,0.15367039442062377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,16,1,balanced,0.07037866612275441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,16,1,balanced,0.07220800220966339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,16,1,power_law_1.01,0.06908159852027893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,16,1,power_law_1.01,0.06912639737129211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,16,1,power_law_1.2,0.06899200081825256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,16,1,power_law_1.2,0.07017599940299987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,2,1,balanced,0.37489068508148193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,2,1,balanced,0.40518399079640705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,2,1,power_law_1.01,0.37216639518737793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,2,1,power_law_1.01,0.37579519748687745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,2,1,power_law_1.2,0.3699199914932251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,2,1,power_law_1.2,0.3802687883377075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,32,1,balanced,0.05375466744105021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,32,1,balanced,0.054010664423306785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,32,1,power_law_1.01,0.05059840083122254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,32,1,power_law_1.01,0.051052802801132204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,32,1,power_law_1.2,0.05143679976463318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,32,1,power_law_1.2,0.05270400047302246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,4,1,balanced,0.21311465899149576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,4,1,balanced,0.23147199551264444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,4,1,power_law_1.01,0.21167359352111817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,4,1,power_law_1.01,0.2126528024673462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,4,1,power_law_1.2,0.20992000102996827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,4,1,power_law_1.2,0.2142335891723633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,8,1,balanced,0.12781866391499838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,8,1,balanced,0.14285866419474283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,8,1,power_law_1.01,0.12389119863510131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,8,1,power_law_1.01,0.12624000310897826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,8,1,power_law_1.2,0.131494402885437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,16384,2,8,8,1,power_law_1.2,0.13631999492645264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,1,balanced,1.3734666506449382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,1,balanced,1.3756213188171387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,1,power_law_1.01,1.0195903778076172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,1,power_law_1.01,1.029088020324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,1,power_law_1.2,0.9339903831481934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,1,power_law_1.2,0.9342399597167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,128,balanced,0.04970666766166687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,128,balanced,0.04987200101216634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,128,power_law_1.01,0.06272640228271484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,128,power_law_1.01,0.06319360136985779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,128,power_law_1.2,0.06071680188179016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,128,power_law_1.2,0.06336640119552613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,16,balanced,0.14268799622853598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,16,balanced,0.14479999740918478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,16,power_law_1.01,0.20648961067199706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,16,power_law_1.01,0.21133439540863036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,16,power_law_1.2,0.22048640251159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,16,power_law_1.2,0.22079999446868898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,2,balanced,0.7147093613942465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,2,balanced,0.7167999744415283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,2,power_law_1.01,0.5824448108673096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,2,power_law_1.01,0.6162240028381347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,2,power_law_1.2,0.5797952175140381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,2,power_law_1.2,0.5995584011077881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,256,balanced,0.049626668294270836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,256,balanced,0.04985066751639048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,256,power_law_1.01,0.04710400104522705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,256,power_law_1.01,0.04750719964504242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,256,power_law_1.2,0.04747520089149475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,256,power_law_1.2,0.04769279956817627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,32,balanced,0.08413333694140117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,32,balanced,0.08462933699289958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,32,power_law_1.01,0.12665599584579468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,32,power_law_1.01,0.12866560220718384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,32,power_law_1.2,0.11672320365905761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,32,power_law_1.2,0.11906559467315674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,4,balanced,0.3782506783803304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,4,balanced,0.3798240025838216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,4,power_law_1.01,0.37681920528411866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,4,power_law_1.01,0.4274432182312012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,4,power_law_1.2,0.3960832118988037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,4,power_law_1.2,0.4332287788391113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,64,balanced,0.06396799782911937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,64,balanced,0.06630933284759521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,64,power_law_1.01,0.07432320117950439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,64,power_law_1.01,0.0782975971698761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,64,power_law_1.2,0.0710207998752594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,64,power_law_1.2,0.07704319953918456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,8,balanced,0.22218134005864462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,8,balanced,0.2233546574910482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,8,power_law_1.01,0.30300159454345704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,8,power_law_1.01,0.32807040214538574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,8,power_law_1.2,0.3011840105056763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,1,8,power_law_1.2,0.3172032117843628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,16,1,balanced,0.19056532780329385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,16,1,balanced,0.19157866636912027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,16,1,power_law_1.01,0.1360703945159912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,16,1,power_law_1.01,0.13640960454940795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,16,1,power_law_1.2,0.1257024049758911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,16,1,power_law_1.2,0.12660479545593262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,2,1,balanced,0.7236639658610026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,2,1,balanced,0.7257493336995443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,2,1,power_law_1.01,0.5432703971862793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,2,1,power_law_1.01,0.5654592037200927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,2,1,power_law_1.2,0.48696317672729494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,2,1,power_law_1.2,0.4877312183380127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,32,1,balanced,0.1451573371887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,32,1,balanced,0.1460640033086141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,32,1,power_law_1.01,0.11743999719619751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,32,1,power_law_1.01,0.1190335988998413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,32,1,power_law_1.2,0.11006720066070556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,32,1,power_law_1.2,0.11125119924545288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,4,1,balanced,0.4017599821090698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,4,1,balanced,0.40343467394510907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,4,1,power_law_1.01,0.312940788269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,4,1,power_law_1.01,0.3129983901977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,4,1,power_law_1.2,0.28370559215545654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,4,1,power_law_1.2,0.29154560565948484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,8,1,balanced,0.26082666714986164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,8,1,balanced,0.26261866092681885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,8,1,power_law_1.01,0.19457279443740844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,8,1,power_law_1.01,0.2002432107925415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,8,1,power_law_1.2,0.17900799512863158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2048,8,256,8,1,power_law_1.2,0.1835904002189636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,1,balanced,1.702799956003825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,1,balanced,1.7057813008626301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,1,power_law_1.01,1.0095808029174804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,1,power_law_1.01,1.026585578918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,1,power_law_1.2,0.8715007781982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,1,power_law_1.2,0.8995200157165527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,16,balanced,0.15288533767064413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,16,balanced,0.15338666240374246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,16,power_law_1.01,0.13642879724502563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,16,power_law_1.01,0.1406272053718567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,16,power_law_1.2,0.12498559951782226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,16,power_law_1.2,0.1408511996269226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,2,balanced,0.8762826919555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,2,balanced,0.8782133261362711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,2,power_law_1.01,0.572870397567749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,2,power_law_1.01,0.5979392051696777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,2,power_law_1.2,0.5634431838989258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,2,power_law_1.2,0.5716864109039307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,32,balanced,0.09295466542243958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,32,balanced,0.09417066971460979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,32,power_law_1.01,0.08969600200653076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,32,power_law_1.01,0.103603196144104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,32,power_law_1.2,0.08140159845352173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,32,power_law_1.2,0.09258880019187928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,4,balanced,0.45996801058451336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,4,balanced,0.4601653416951497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,4,power_law_1.01,0.3279680013656616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,4,power_law_1.01,0.36584959030151365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,4,power_law_1.2,0.32429440021514894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,4,power_law_1.2,0.341158390045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,8,balanced,0.2505333423614502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,8,balanced,0.25195199251174927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,8,power_law_1.01,0.26382079124450686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,8,power_law_1.01,0.2686527967453003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,8,power_law_1.2,0.1994047999382019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,1,8,power_law_1.2,0.23366398811340333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,16,1,balanced,0.2183039983113607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,16,1,balanced,0.21928532918294272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,16,1,power_law_1.01,0.1339136004447937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,16,1,power_law_1.01,0.13496320247650145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,16,1,power_law_1.2,0.12391040325164795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,16,1,power_law_1.2,0.12983039617538453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,2,1,balanced,0.8746026357014974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,2,1,balanced,0.8760000069936117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,2,1,power_law_1.01,0.49784321784973146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,2,1,power_law_1.01,0.5327744007110595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,2,1,power_law_1.2,0.4924928188323975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,2,1,power_law_1.2,0.4977536201477051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,32,1,balanced,0.15467199683189392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,32,1,balanced,0.15472533305486044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,32,1,power_law_1.01,0.10572799444198608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,32,1,power_law_1.01,0.10643839836120605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,32,1,power_law_1.2,0.09496319890022278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,32,1,power_law_1.2,0.09950720071792603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,4,1,balanced,0.48051198323567706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,4,1,balanced,0.4914613167444865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,4,1,power_law_1.01,0.29755520820617676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,4,1,power_law_1.01,0.3038975954055786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,4,1,power_law_1.2,0.280076789855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,4,1,power_law_1.2,0.2814079999923706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,8,1,balanced,0.29397332668304443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,8,1,balanced,0.2948213418324788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,8,1,power_law_1.01,0.18520959615707397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,8,1,power_law_1.01,0.19237760305404664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,8,1,power_law_1.2,0.17686400413513184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,6144,2560,8,160,8,1,power_law_1.2,0.17748479843139647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,1,balanced,1.5968106587727864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,1,balanced,1.5976640383402507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,1,power_law_1.01,1.2179136276245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,1,power_law_1.01,1.2276800155639649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,1,power_law_1.2,1.0677375793457031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,1,power_law_1.2,1.0996031761169434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,128,balanced,0.05491200089454651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,128,balanced,0.05596266686916351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,128,power_law_1.01,0.06940159797668458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,128,power_law_1.01,0.07066239714622498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,128,power_law_1.2,0.06962559819221496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,128,power_law_1.2,0.069760000705719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,16,balanced,0.16200000047683716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,16,balanced,0.1649493376413981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,16,power_law_1.01,0.23916161060333252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,16,power_law_1.01,0.25217280387878416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,16,power_law_1.2,0.2542272090911865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,16,power_law_1.2,0.25471360683441163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,2,balanced,0.8309546311696371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,2,balanced,0.8333706855773926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,2,power_law_1.01,0.6845952033996582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,2,power_law_1.01,0.7074111938476563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,2,power_law_1.2,0.6722303867340088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,2,power_law_1.2,0.6816319942474365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,256,balanced,0.05539200206597646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,256,balanced,0.05611733098824819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,256,power_law_1.01,0.054713600873947145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,256,power_law_1.01,0.054745602607727054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,256,power_law_1.2,0.055129599571228025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,256,power_law_1.2,0.05546879768371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,32,balanced,0.09582933783531189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,32,balanced,0.09596799810727437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,32,power_law_1.01,0.1344063997268677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,32,power_law_1.01,0.13509119749069215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,32,power_law_1.2,0.12563199996948243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,32,power_law_1.2,0.14965759515762328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,4,balanced,0.4355039993921916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,4,balanced,0.4368480046590169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,4,power_law_1.01,0.49050240516662597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,4,power_law_1.01,0.5080959796905518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,4,power_law_1.2,0.41448321342468264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,4,power_law_1.2,0.463424015045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,64,balanced,0.07223999996980031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,64,balanced,0.07233066856861115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,64,power_law_1.01,0.08271359801292419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,64,power_law_1.01,0.08967679738998413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,64,power_law_1.2,0.07848320007324219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,64,power_law_1.2,0.07947520017623902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,8,balanced,0.25435733795166016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,8,balanced,0.27137066920598346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,8,power_law_1.01,0.36757760047912597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,8,power_law_1.01,0.378656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,8,power_law_1.2,0.3785599946975708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,1,8,power_law_1.2,0.4002816200256348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,16,1,balanced,0.21812800566355386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,16,1,balanced,0.21851734320322672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,16,1,power_law_1.01,0.15471999645233153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,16,1,power_law_1.01,0.15875200033187867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,16,1,power_law_1.2,0.14383360147476196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,16,1,power_law_1.2,0.14740480184555055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,2,1,balanced,0.8422559897104899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,2,1,balanced,0.8726613521575928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,2,1,power_law_1.01,0.6341567993164062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,2,1,power_law_1.01,0.6358784198760986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,2,1,power_law_1.2,0.5648384094238281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,2,1,power_law_1.2,0.5741759777069092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,32,1,balanced,0.1660426656405131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,32,1,balanced,0.16643200318018594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,32,1,power_law_1.01,0.1339903950691223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,32,1,power_law_1.01,0.13560320138931276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,32,1,power_law_1.2,0.12565120458602905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,32,1,power_law_1.2,0.12654720544815062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,4,1,balanced,0.46323732535044354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,4,1,balanced,0.5023626486460367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,4,1,power_law_1.01,0.36011519432067873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,4,1,power_law_1.01,0.36195199489593505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,4,1,power_law_1.2,0.3159039974212646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,4,1,power_law_1.2,0.3381184101104736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,8,1,balanced,0.30179200569788617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,8,1,balanced,0.30240533749262494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,8,1,power_law_1.01,0.22760961055755616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,8,1,power_law_1.01,0.22832000255584717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,8,1,power_law_1.2,0.20274560451507567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,256,8,1,power_law_1.2,0.2056960105895996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,1,balanced,1.595962683359782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,1,balanced,1.598314603169759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,1,power_law_1.01,1.4556287765502929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,1,power_law_1.01,1.4622400283813477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,1,power_law_1.2,1.3027584075927734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,1,power_law_1.2,1.3151679992675782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,128,balanced,0.055829331278800964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,128,balanced,0.05611200133959452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,128,power_law_1.01,0.07477759718894958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,128,power_law_1.01,0.07664639949798584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,128,power_law_1.2,0.07160959839820862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,128,power_law_1.2,0.0716863989830017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,16,balanced,0.161871999502182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,16,balanced,0.16609600186347961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,16,power_law_1.01,0.3388479948043823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,16,power_law_1.01,0.34323840141296386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,16,power_law_1.2,0.3424704074859619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,16,power_law_1.2,0.34282240867614744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,2,balanced,0.8347040017445883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,2,balanced,0.8501173655192057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,2,power_law_1.01,0.8860287666320801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,2,power_law_1.01,0.9201343536376954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,2,power_law_1.2,0.7911424160003662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,2,power_law_1.2,0.817471981048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,32,balanced,0.09705066680908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,32,balanced,0.09714133540789287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,32,power_law_1.01,0.19102079868316652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,32,power_law_1.01,0.19242240190505983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,32,power_law_1.2,0.19015040397644042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,32,power_law_1.2,0.1924415946006775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,4,balanced,0.4362613360087077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,4,balanced,0.4375306765238444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,4,power_law_1.01,0.6088575839996337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,4,power_law_1.01,0.6381631851196289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,4,power_law_1.2,0.5292799949645997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,4,power_law_1.2,0.6047296047210693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,64,balanced,0.07064533233642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,64,balanced,0.07208533088366191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,64,power_law_1.01,0.1132159948348999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,64,power_law_1.01,0.11383039951324463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,64,power_law_1.2,0.1059391975402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,64,power_law_1.2,0.10689280033111573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,8,balanced,0.255349338054657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,8,balanced,0.25989333788553876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,8,power_law_1.01,0.4787456035614014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,8,power_law_1.01,0.49790081977844236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,8,power_law_1.2,0.4614399909973145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,1,8,power_law_1.2,0.5063168048858643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,16,1,balanced,0.21846934159596762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,16,1,balanced,0.22687999407450357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,16,1,power_law_1.01,0.19096319675445556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,16,1,power_law_1.01,0.2012864112854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,16,1,power_law_1.2,0.16510080099105834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,16,1,power_law_1.2,0.16624000072479247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,2,1,balanced,0.8452426592508951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,2,1,balanced,0.8483359813690186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,2,1,power_law_1.01,0.7393792152404786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,2,1,power_law_1.01,0.7601344108581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,2,1,power_law_1.2,0.6845952033996582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,2,1,power_law_1.2,0.6958335876464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,32,1,balanced,0.1670666734377543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,32,1,balanced,0.16781866550445557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,32,1,power_law_1.01,0.15320320129394532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,32,1,power_law_1.01,0.15813119411468507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,32,1,power_law_1.2,0.14232319593429565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,32,1,power_law_1.2,0.1428544044494629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,4,1,balanced,0.46315733591715497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,4,1,balanced,0.47992531458536786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,4,1,power_law_1.01,0.41468157768249514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,4,1,power_law_1.01,0.42795519828796386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,4,1,power_law_1.2,0.380511999130249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,4,1,power_law_1.2,0.38426880836486815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,8,1,balanced,0.3017386595408122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,8,1,balanced,0.3023359974225362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,8,1,power_law_1.01,0.2750080108642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,8,1,power_law_1.01,0.27818880081176756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,8,1,power_law_1.2,0.23928320407867432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16,7168,2048,8,384,8,1,power_law_1.2,0.24150400161743163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,1,balanced,0.21108800172805786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,1,balanced,0.2113813360532125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,1,power_law_1.01,0.21274878978729247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,1,power_law_1.01,0.21432321071624755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,1,power_law_1.2,0.21771519184112548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,1,power_law_1.2,0.21906559467315673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,128,balanced,0.04688533147176107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,128,balanced,0.047168001532554626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,128,power_law_1.01,0.043398401141166686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,128,power_law_1.01,0.043647998571395875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,128,power_law_1.2,0.04490880072116852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,128,power_law_1.2,0.04583680033683777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,16,balanced,0.05226666728655497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,16,balanced,0.05583466589450836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,16,power_law_1.01,0.04885759949684143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,16,power_law_1.01,0.05167999863624573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,16,power_law_1.2,0.051769602298736575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,16,power_law_1.2,0.05403519868850708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,2,balanced,0.13431466619173685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,2,balanced,0.14069333672523499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,2,power_law_1.01,0.1302783966064453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,2,power_law_1.01,0.13122559785842897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,2,power_law_1.2,0.12888959646224976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,2,power_law_1.2,0.1327232003211975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,32,balanced,0.04593066871166229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,32,balanced,0.045935998360315956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,32,power_law_1.01,0.04483200013637543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,32,power_law_1.01,0.045075199007987975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,32,power_law_1.2,0.04478079974651337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,32,power_law_1.2,0.04508160054683685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,4,balanced,0.08916266759236653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,4,balanced,0.08961600065231323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,4,power_law_1.01,0.08584960103034973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,4,power_law_1.01,0.08668799996376038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,4,power_law_1.2,0.08475520014762879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,4,power_law_1.2,0.0865343987941742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,64,balanced,0.045824001232783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,64,balanced,0.04665066798528036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,64,power_law_1.01,0.04343039989471435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,64,power_law_1.01,0.04397439956665039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,64,power_law_1.2,0.04387840032577515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,64,power_law_1.2,0.044684800505638125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,8,balanced,0.0662613312403361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,8,balanced,0.06637866795063019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,8,power_law_1.01,0.06447359919548035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,8,power_law_1.01,0.06573439836502075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,8,power_law_1.2,0.06521599888801574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,1,8,power_law_1.2,0.0662335991859436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,2,1,balanced,0.1337279975414276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,2,1,balanced,0.13414399822553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,2,1,power_law_1.01,0.12654720544815062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,2,1,power_law_1.01,0.12857600450515747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,2,1,power_law_1.2,0.12849279642105102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,2,1,power_law_1.2,0.129312002658844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,4,1,balanced,0.08796800176302592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,4,1,balanced,0.08927466471989949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,4,1,power_law_1.01,0.08328959941864014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,4,1,power_law_1.01,0.0835968017578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,4,1,power_law_1.2,0.08389120101928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2048,768,8,128,4,1,power_law_1.2,0.08521599769592285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,1,balanced,0.5880266825358073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,1,balanced,0.5921493371327718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,1,power_law_1.01,0.5396863937377929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,1,power_law_1.01,0.5598591804504395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,1,power_law_1.2,0.5808127880096435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,1,power_law_1.2,0.5836544036865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,128,balanced,0.06117866436640421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,128,balanced,0.06228266656398773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,128,power_law_1.01,0.06024320125579834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,128,power_law_1.01,0.06037759780883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,128,power_law_1.2,0.06028159856796265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,128,power_law_1.2,0.06077439785003662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,16,balanced,0.08238400022188823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,16,balanced,0.08238933483759563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,16,power_law_1.01,0.07872639894485474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,16,power_law_1.01,0.07969279885292054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,16,power_law_1.2,0.08004480004310607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,16,power_law_1.2,0.08034560084342957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,2,balanced,0.3571679989496867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,2,balanced,0.361194650332133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,2,power_law_1.01,0.3141119956970215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,2,power_law_1.01,0.3242815971374512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,2,power_law_1.2,0.3096191883087158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,2,power_law_1.2,0.32583041191101075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,32,balanced,0.07175466914971669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,32,balanced,0.07284266750017802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,32,power_law_1.01,0.06872959733009339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,32,power_law_1.01,0.07011839747428894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,32,power_law_1.2,0.07052159905433655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,32,power_law_1.2,0.07079039812088013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,4,balanced,0.20579200983047485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,4,balanced,0.20685333013534546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,4,power_law_1.01,0.18145279884338378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,4,power_law_1.01,0.19271680116653442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,4,power_law_1.2,0.18421119451522827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,4,power_law_1.2,0.19752960205078124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,64,balanced,0.06284266710281372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,64,balanced,0.06297599772612254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,64,power_law_1.01,0.0606719970703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,64,power_law_1.01,0.061926400661468504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,64,power_law_1.2,0.06034560203552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,64,power_law_1.2,0.06082559823989868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,8,balanced,0.12876266241073608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,8,balanced,0.13014400005340576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,8,power_law_1.01,0.11375999450683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,8,power_law_1.01,0.12200959920883178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,8,power_law_1.2,0.11587200164794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,1,8,power_law_1.2,0.12355200052261353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,16,1,balanced,0.21917333205540976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,16,1,balanced,0.21991999944051108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,16,1,power_law_1.01,0.19957760572433472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,16,1,power_law_1.01,0.20018560886383058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,16,1,power_law_1.2,0.20851199626922606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,16,1,power_law_1.2,0.20940160751342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,2,1,balanced,0.3478240172068278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,2,1,balanced,0.34929601351420086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,2,1,power_law_1.01,0.3137216091156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,2,1,power_law_1.01,0.3145087957382202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,2,1,power_law_1.2,0.32119040489196776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,2,1,power_law_1.2,0.32213120460510253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,32,1,balanced,0.18751466274261475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,32,1,balanced,0.18762133518854776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,32,1,power_law_1.01,0.16926079988479614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,32,1,power_law_1.01,0.17274240255355836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,32,1,power_law_1.2,0.1686784029006958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,32,1,power_law_1.2,0.17393920421600342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,4,1,balanced,0.2037280003229777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,4,1,balanced,0.2055893341700236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,4,1,power_law_1.01,0.18436479568481445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,4,1,power_law_1.01,0.19084800481796266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,4,1,power_law_1.2,0.19533439874649047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,4,1,power_law_1.2,0.19702399969100953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,8,1,balanced,0.3212053378423055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,8,1,balanced,0.32235199213027954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,8,1,power_law_1.01,0.2905535936355591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,8,1,power_law_1.01,0.30212481021881105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,8,1,power_law_1.2,0.3002559900283813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,2688,1856,6,128,8,1,power_law_1.2,0.30323200225830077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,1,balanced,1.1594399611155193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,1,balanced,1.1642026901245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,1,power_law_1.01,0.9486847877502441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,1,power_law_1.01,0.9922112464904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,1,power_law_1.2,0.9592127799987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,1,power_law_1.2,0.9764800071716309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,128,balanced,0.0927946666876475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,128,balanced,0.0932426651318868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,128,power_law_1.01,0.09182720184326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,128,power_law_1.01,0.0920960009098053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,128,power_law_1.2,0.09257599711418152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,128,power_law_1.2,0.09300479888916016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,16,balanced,0.15219733119010925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,16,balanced,0.15364799896876016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,16,power_law_1.01,0.1364799976348877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,16,power_law_1.01,0.14217599630355834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,16,power_law_1.2,0.1357632040977478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,16,power_law_1.2,0.13976320028305053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,2,balanced,0.6119253238042196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,2,balanced,0.6159786780675253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,2,power_law_1.01,0.5454271793365478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,2,power_law_1.01,0.5570879936218261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,2,power_law_1.2,0.5035071849822998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,2,power_law_1.2,0.50447998046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,256,balanced,0.0928053359190623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,256,balanced,0.09461333354314168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,256,power_law_1.01,0.09185280203819275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,256,power_law_1.01,0.09220479726791382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,256,power_law_1.2,0.09187840223312378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,256,power_law_1.2,0.09208959937095643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,32,balanced,0.10897599657376607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,32,balanced,0.11030933260917664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,32,power_law_1.01,0.10474879741668701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,32,power_law_1.01,0.1058303952217102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,32,power_law_1.2,0.10574719905853272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,32,power_law_1.2,0.10658559799194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,4,balanced,0.35203198591868085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,4,balanced,0.3555519978205363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,4,power_law_1.01,0.3114304065704346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,4,power_law_1.01,0.3120703935623169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,4,power_law_1.2,0.313971209526062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,4,power_law_1.2,0.32150399684906006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,64,balanced,0.0995840032895406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,64,balanced,0.09993066390355428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,64,power_law_1.01,0.09812480211257935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,64,power_law_1.01,0.09843199849128723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,64,power_law_1.2,0.09754239916801452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,64,power_law_1.2,0.09818879961967468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,8,balanced,0.21412267287572226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,8,balanced,0.2178666591644287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,8,power_law_1.01,0.19701119661331176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,8,power_law_1.01,0.19981440305709838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,8,power_law_1.2,0.19479680061340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,1,8,power_law_1.2,0.20129919052124023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,16,1,balanced,0.16325866182645163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,16,1,balanced,0.16382933656374613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,16,1,power_law_1.01,0.13127679824829103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,16,1,power_law_1.01,0.14032000303268433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,16,1,power_law_1.2,0.13112959861755372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,16,1,power_law_1.2,0.13143680095672608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,2,1,balanced,0.5987626711527506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,2,1,balanced,0.6014453172683716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,2,1,power_law_1.01,0.5036416053771973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,2,1,power_law_1.01,0.5061503887176514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,2,1,power_law_1.2,0.5089280128479003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,2,1,power_law_1.2,0.5099775791168213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,32,1,balanced,0.11967999736467998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,32,1,balanced,0.12026133139928182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,32,1,power_law_1.01,0.11055359840393067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,32,1,power_law_1.01,0.11210240125656128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,32,1,power_law_1.2,0.11206400394439697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,32,1,power_law_1.2,0.11250560283660889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,4,1,balanced,0.3366933266321818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,4,1,balanced,0.3372746706008911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,4,1,power_law_1.01,0.2823807954788208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,4,1,power_law_1.01,0.28431360721588134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,4,1,power_law_1.2,0.2845439910888672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,4,1,power_law_1.2,0.30023679733276365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,8,1,balanced,0.20456000169118246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,8,1,balanced,0.20508267482121786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,8,1,power_law_1.01,0.18540159463882447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,8,1,power_law_1.01,0.18584320545196534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,8,1,power_law_1.2,0.1851263999938965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,3072,1536,8,256,8,1,power_law_1.2,0.18558080196380616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,1,balanced,0.5119733413060507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,1,balanced,0.5131093263626099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,1,power_law_1.01,0.5570176124572754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,1,power_law_1.01,0.5657663822174073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,1,power_law_1.2,0.5730624198913574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,1,power_law_1.2,0.5776832103729248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,2,balanced,0.33847999572753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,2,balanced,0.3386559883753459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,2,power_law_1.01,0.36867198944091795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,2,power_law_1.01,0.377836799621582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,2,power_law_1.2,0.36240639686584475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,2,power_law_1.2,0.3717888116836548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,4,balanced,0.25549866755803424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,4,balanced,0.2593226631482442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,4,power_law_1.01,0.26150400638580323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,4,power_law_1.01,0.2808768033981323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,4,power_law_1.2,0.28211839199066163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,4,power_law_1.2,0.2957119941711426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,8,balanced,0.21146132548650107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,8,balanced,0.2191093365351359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,8,power_law_1.01,0.23208320140838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,8,power_law_1.01,0.23393919467926025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,8,power_law_1.2,0.23101439476013183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,1,8,power_law_1.2,0.23350400924682618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,16,1,balanced,0.07442666590213776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,16,1,balanced,0.07595733304818471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,16,1,power_law_1.01,0.07500159740447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,16,1,power_law_1.01,0.07594879865646362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,16,1,power_law_1.2,0.07537279725074768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,16,1,power_law_1.2,0.07612800002098083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,2,1,balanced,0.28310932715733844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,2,1,balanced,0.28551467259724933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,2,1,power_law_1.01,0.28556160926818847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,2,1,power_law_1.01,0.29033598899841306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,2,1,power_law_1.2,0.2849087953567505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,2,1,power_law_1.2,0.29482879638671877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,32,1,balanced,0.05784533421198527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,32,1,balanced,0.06016000111897787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,32,1,power_law_1.01,0.06368640065193176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,32,1,power_law_1.01,0.0641152024269104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,32,1,power_law_1.2,0.06229119896888733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,32,1,power_law_1.2,0.06362879872322083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,4,1,balanced,0.17179733514785767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,4,1,balanced,0.17352000872294107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,4,1,power_law_1.01,0.16711039543151857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,4,1,power_law_1.01,0.1700160026550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,4,1,power_law_1.2,0.16714240312576295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,4,1,power_law_1.2,0.1684991955757141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,8,1,balanced,0.09706667065620422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,8,1,balanced,0.10106133421262105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,8,1,power_law_1.01,0.0967743992805481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,8,1,power_law_1.01,0.09758719801902771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,8,1,power_law_1.2,0.09770879745483399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,14336,2,8,8,1,power_law_1.2,0.09863680005073547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,1,balanced,0.7797973155975342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,1,balanced,0.7824479738871256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,1,power_law_1.01,0.7497024059295654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,1,power_law_1.01,0.751692819595337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,1,power_law_1.2,0.7509503841400147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,1,power_law_1.2,0.7685376167297363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,128,balanced,0.07689600189526875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,128,balanced,0.07771733403205872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,128,power_law_1.01,0.07071359753608704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,128,power_law_1.01,0.07301120162010193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,128,power_law_1.2,0.074508798122406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,128,power_law_1.2,0.07605760097503662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,16,balanced,0.10710400342941284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,16,balanced,0.10730666915575664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,16,power_law_1.01,0.10361599922180176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,16,power_law_1.01,0.10423040390014648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,16,power_law_1.2,0.1045375943183899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,16,power_law_1.2,0.1061568021774292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,2,balanced,0.42664531866709393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,2,balanced,0.4282453457514445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,2,power_law_1.01,0.41516799926757814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,2,power_law_1.01,0.4231935977935791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,2,power_law_1.2,0.4198783874511719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,2,power_law_1.2,0.4228352069854736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,32,balanced,0.09308800101280212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,32,balanced,0.0935040016969045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,32,power_law_1.01,0.09173759818077087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,32,power_law_1.01,0.09214720129966736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,32,power_law_1.2,0.09210240244865417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,32,power_law_1.2,0.09251840114593506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,4,balanced,0.24239999055862427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,4,balanced,0.24421866734822592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,4,power_law_1.01,0.23800959587097167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,4,power_law_1.01,0.23919360637664794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,4,power_law_1.2,0.2412992000579834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,4,power_law_1.2,0.24238719940185546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,64,balanced,0.08477866649627686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,64,balanced,0.08486933509508769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,64,power_law_1.01,0.08173440098762512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,64,power_law_1.01,0.0832256019115448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,64,power_law_1.2,0.08553599715232849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,64,power_law_1.2,0.08562560081481933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,8,balanced,0.15466666221618652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,8,balanced,0.15526400009791055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,8,power_law_1.01,0.14926079511642457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,8,power_law_1.01,0.1494976043701172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,8,power_law_1.2,0.14940160512924194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,1,8,power_law_1.2,0.1498944044113159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,16,1,balanced,0.11748266220092773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,16,1,balanced,0.11962133646011353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,16,1,power_law_1.01,0.11384960412979125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,16,1,power_law_1.01,0.11424000263214111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,16,1,power_law_1.2,0.11512960195541382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,16,1,power_law_1.2,0.1151360034942627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,2,1,balanced,0.39175466696421307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,2,1,balanced,0.3954399824142456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,2,1,power_law_1.01,0.3910975933074951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,2,1,power_law_1.01,0.4018303871154785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,2,1,power_law_1.2,0.4031231880187988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,2,1,power_law_1.2,0.4064320087432861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,32,1,balanced,0.10286399722099304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,32,1,balanced,0.10466133554776509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,32,1,power_law_1.01,0.10062079429626465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,32,1,power_law_1.01,0.10081280469894409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,32,1,power_law_1.2,0.10158079862594604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,32,1,power_law_1.2,0.10172159671783447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,4,1,balanced,0.23468265930811563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,4,1,balanced,0.23484800259272257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,4,1,power_law_1.01,0.22476160526275635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,4,1,power_law_1.01,0.2248255968093872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,4,1,power_law_1.2,0.22583680152893065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,4,1,power_law_1.2,0.22933759689331054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,8,1,balanced,0.15035733580589294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,8,1,balanced,0.15038399895032248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,8,1,power_law_1.01,0.14204800128936768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,8,1,power_law_1.01,0.14383360147476196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,8,1,power_law_1.2,0.14266879558563234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,1536,8,128,8,1,power_law_1.2,0.14292479753494264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,1,balanced,5.249423980712891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,1,balanced,5.261082649230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,1,power_law_1.01,4.640351867675781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,1,power_law_1.01,4.656159973144531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,1,power_law_1.2,4.8464000701904295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,1,power_law_1.2,4.984000015258789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,128,balanced,0.2772746682167053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,128,balanced,0.27859199047088623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,128,power_law_1.01,0.2750720024108887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,128,power_law_1.01,0.27696640491485597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,128,power_law_1.2,0.2751744031906128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,128,power_law_1.2,0.27525761127471926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,16,balanced,0.5779626766840616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,16,balanced,0.5782560110092163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,16,power_law_1.01,0.5479936122894287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,16,power_law_1.01,0.5490431785583496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,16,power_law_1.2,0.5500095844268799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,16,power_law_1.2,0.5503039836883545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,2,balanced,2.722618738810221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,2,balanced,2.810624122619629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,2,power_law_1.01,2.4129600524902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,2,power_law_1.01,2.4593599319458006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,2,power_law_1.2,2.5133312225341795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,2,power_law_1.2,2.5312576293945312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,256,balanced,0.266757329305013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,256,balanced,0.26899200677871704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,256,power_law_1.01,0.26565120220184324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,256,power_law_1.01,0.26672000885009767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,256,power_law_1.2,0.2666559934616089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,256,power_law_1.2,0.26695680618286133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,32,balanced,0.41017599900563556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,32,balanced,0.41495998700459796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,32,power_law_1.01,0.3994175910949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,32,power_law_1.01,0.4006336212158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,32,power_law_1.2,0.4014848232269287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,32,power_law_1.2,0.4070784091949463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,4,balanced,1.4955253601074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,4,balanced,1.502522627512614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,4,power_law_1.01,1.353932762145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,4,power_law_1.01,1.3582783699035645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,4,power_law_1.2,1.3611328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,4,power_law_1.2,1.3913472175598145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,64,balanced,0.3121280074119568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,64,balanced,0.3123253385225932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,64,power_law_1.01,0.3062272071838379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,64,power_law_1.01,0.3102976083755493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,64,power_law_1.2,0.3054975986480713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,64,power_law_1.2,0.3069119930267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,8,balanced,0.8816533088684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,8,balanced,0.8827786445617676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,8,power_law_1.01,0.8073856353759765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,8,power_law_1.01,0.841312026977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,8,power_law_1.2,0.8168831825256347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,1,8,power_law_1.2,0.8263999938964843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,16,1,balanced,1.4458667437235515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,16,1,balanced,1.4484532674153645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,16,1,power_law_1.01,1.2981632232666016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,16,1,power_law_1.01,1.3186944007873536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,16,1,power_law_1.2,1.3081727981567384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,16,1,power_law_1.2,1.3091008186340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,2,1,balanced,2.479109287261963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,2,1,balanced,2.482954661051432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,2,1,power_law_1.01,2.21964168548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,2,1,power_law_1.01,2.2462783813476563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,2,1,power_law_1.2,2.2678144454956053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,2,1,power_law_1.2,2.2909311294555663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,32,1,balanced,1.1413119633992512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,32,1,balanced,1.142143964767456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,32,1,power_law_1.01,1.0214271545410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,32,1,power_law_1.01,1.0217663764953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,32,1,power_law_1.2,1.0548352241516112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,32,1,power_law_1.2,1.0552255630493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,4,1,balanced,1.3827625910441081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,4,1,balanced,1.3858933448791504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,4,1,power_law_1.01,1.2613887786865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,4,1,power_law_1.01,1.2633536338806153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,4,1,power_law_1.2,1.292684841156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,4,1,power_law_1.2,1.301689624786377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,8,1,balanced,0.772816022237142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,8,1,balanced,0.7776426474253336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,8,1,power_law_1.01,0.7067903995513916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,8,1,power_law_1.01,0.7090112209320069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,8,1,power_law_1.2,0.7236735820770264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,4096,2688,22,512,8,1,power_law_1.2,0.7251520156860352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,1,balanced,0.798688014348348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,1,balanced,0.7994399865468343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,1,power_law_1.01,0.9818495750427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,1,power_law_1.01,1.0160063743591308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,1,power_law_1.2,0.9922112464904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,1,power_law_1.2,1.0453248023986816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,2,balanced,0.4827306667963664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,2,balanced,0.48447998364766437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,2,power_law_1.01,0.5487040042877197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,2,power_law_1.01,0.5812416076660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,2,power_law_1.2,0.558016014099121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,2,power_law_1.2,0.5596223831176758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,4,balanced,0.3362720012664795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,4,balanced,0.3396159807840983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,4,power_law_1.01,0.38667519092559816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,4,power_law_1.01,0.38755199909210203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,4,power_law_1.2,0.4048768043518066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,4,power_law_1.2,0.41321601867675783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,8,balanced,0.26475733518600464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,8,balanced,0.26626133918762207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,8,power_law_1.01,0.29875199794769286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,8,power_law_1.01,0.3007744073867798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,8,power_law_1.2,0.2988352060317993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,1,8,power_law_1.2,0.2990592002868652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,16,1,balanced,0.10175999999046326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,16,1,balanced,0.10288000106811523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,16,1,power_law_1.01,0.10839040279388427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,16,1,power_law_1.01,0.11041280031204223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,16,1,power_law_1.2,0.10973440408706665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,16,1,power_law_1.2,0.11055359840393067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,2,1,balanced,0.43721067905426025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,2,1,balanced,0.43859732151031494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,2,1,power_law_1.01,0.4869120121002197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,2,1,power_law_1.01,0.5069119930267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,2,1,power_law_1.2,0.47505922317504884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,2,1,power_law_1.2,0.4879487991333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,32,1,balanced,0.08751466870307922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,32,1,balanced,0.08890666564305623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,32,1,power_law_1.01,0.09131519794464112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,32,1,power_law_1.01,0.09162240028381348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,32,1,power_law_1.2,0.08991360068321227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,32,1,power_law_1.2,0.09080960154533387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,4,1,balanced,0.2531306743621826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,4,1,balanced,0.25693867603937787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,4,1,power_law_1.01,0.26903040409088136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,4,1,power_law_1.01,0.27292799949645996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,4,1,power_law_1.2,0.2752000093460083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,4,1,power_law_1.2,0.2755136013031006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,8,1,balanced,0.13486400246620178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,8,1,balanced,0.1381439963976542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,8,1,power_law_1.01,0.14633599519729615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,8,1,power_law_1.01,0.15029120445251465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,8,1,power_law_1.2,0.14636800289154053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,16384,2,8,8,1,power_law_1.2,0.14824960231781006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,1,balanced,2.9583040873209634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,1,balanced,3.110879898071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,1,power_law_1.01,2.484480094909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,1,power_law_1.01,2.522323226928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,1,power_law_1.2,2.45034236907959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,1,power_law_1.2,2.4518848419189454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,128,balanced,0.15658133228619894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,128,balanced,0.1583573321501414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,128,power_law_1.01,0.15534720420837403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,128,power_law_1.01,0.15588480234146118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,128,power_law_1.2,0.1544319987297058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,128,power_law_1.2,0.15502079725265502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,16,balanced,0.3167840043703715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,16,balanced,0.31752000252405804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,16,power_law_1.01,0.2929215908050537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,16,power_law_1.01,0.29948160648345945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,16,power_law_1.2,0.2998143911361694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,16,power_law_1.2,0.3065727949142456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,2,balanced,1.5570613543192546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,2,balanced,1.5931520462036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,2,power_law_1.01,1.282374382019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,2,power_law_1.01,1.310540771484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,2,power_law_1.2,1.3114687919616699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,2,power_law_1.2,1.371609592437744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,256,balanced,0.15236799915631613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,256,balanced,0.15272000432014465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,256,power_law_1.01,0.14999680519104003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,256,power_law_1.01,0.15037440061569213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,256,power_law_1.2,0.15086079835891725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,256,power_law_1.2,0.15145599842071533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,32,balanced,0.20331732432047525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,32,balanced,0.20333333810170492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,32,power_law_1.01,0.19731839895248413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,32,power_law_1.01,0.19985920190811157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,32,power_law_1.2,0.1928704023361206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,32,power_law_1.2,0.19454079866409302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,4,balanced,0.8339040279388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,4,balanced,0.8347787062327067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,4,power_law_1.01,0.714515209197998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,4,power_law_1.01,0.7436223983764648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,4,power_law_1.2,0.7219903945922852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,4,power_law_1.2,0.7862592220306397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,64,balanced,0.16502400239308676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,64,balanced,0.16567466656366983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,64,power_law_1.01,0.16201599836349487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,64,power_law_1.01,0.16355839967727662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,64,power_law_1.2,0.16189440488815307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,64,power_law_1.2,0.1631999969482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,8,balanced,0.48865067958831787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,8,balanced,0.49118932088216144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,8,power_law_1.01,0.4388671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,8,power_law_1.01,0.45397119522094725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,8,power_law_1.2,0.4469503879547119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,1,8,power_law_1.2,0.4616960048675537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,16,1,balanced,0.32261866331100464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,16,1,balanced,0.32340800762176514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,16,1,power_law_1.01,0.2591423988342285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,16,1,power_law_1.01,0.2684992074966431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,16,1,power_law_1.2,0.2563391923904419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,16,1,power_law_1.2,0.25673599243164064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,2,1,balanced,1.5416213671366374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,2,1,balanced,1.5444213549296062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,2,1,power_law_1.01,1.3089983940124512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,2,1,power_law_1.01,1.3094400405883788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,2,1,power_law_1.2,1.2676799774169922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,2,1,power_law_1.2,1.2926783561706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,32,1,balanced,0.22330133120218912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,32,1,balanced,0.22331732511520386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,32,1,power_law_1.01,0.20551679134368897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,32,1,power_law_1.01,0.20581119060516356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,32,1,power_law_1.2,0.20584321022033691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,32,1,power_law_1.2,0.206496000289917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,4,1,balanced,0.7978400389353434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,4,1,balanced,0.7996746699015299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,4,1,power_law_1.01,0.6780352115631103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,4,1,power_law_1.01,0.6961919784545898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,4,1,power_law_1.2,0.6751999855041504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,4,1,power_law_1.2,0.6974271774291992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,8,1,balanced,0.47062400976816815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,8,1,balanced,0.4724213282267253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,8,1,power_law_1.01,0.38939518928527833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,8,1,power_law_1.01,0.40543360710144044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,8,1,power_law_1.2,0.385100793838501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2048,8,256,8,1,power_law_1.2,0.39044480323791503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,1,balanced,2.3326613108317056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,1,balanced,2.3594719568888345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,1,power_law_1.01,2.2091455459594727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,1,power_law_1.01,2.219897651672363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,1,power_law_1.2,2.192723274230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,1,power_law_1.2,2.223673629760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,16,balanced,0.24541334311167398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,16,balanced,0.24849599599838257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,16,power_law_1.01,0.23420801162719726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,16,power_law_1.01,0.23998720645904542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,16,power_law_1.2,0.23500800132751465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,16,power_law_1.2,0.24413440227508545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,2,balanced,1.2464906374613445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,2,balanced,1.2561333179473877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,2,power_law_1.01,1.114137554168701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,2,power_law_1.01,1.1272640228271484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,2,power_law_1.2,1.164902400970459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,2,power_law_1.2,1.1750144004821776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,32,balanced,0.1584213376045227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,32,balanced,0.16009599963823953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,32,power_law_1.01,0.153164803981781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,32,power_law_1.01,0.15629440546035767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,32,power_law_1.2,0.15780479907989503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,32,power_law_1.2,0.15790079832077025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,4,balanced,0.6570880015691122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,4,balanced,0.6593013207117716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,4,power_law_1.01,0.6297664165496826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,4,power_law_1.01,0.6408063888549804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,4,power_law_1.2,0.6278016090393066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,4,power_law_1.2,0.6428991794586182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,8,balanced,0.3754506508509318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,8,balanced,0.3768639961878459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,8,power_law_1.01,0.35489280223846437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,8,power_law_1.01,0.3566335916519165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,8,power_law_1.2,0.3654335975646973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,1,8,power_law_1.2,0.36725759506225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,16,1,balanced,0.26390933990478516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,16,1,balanced,0.26554665962855023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,16,1,power_law_1.01,0.21217920780181884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,16,1,power_law_1.01,0.22330880165100098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,16,1,power_law_1.2,0.2320512056350708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,16,1,power_law_1.2,0.24856319427490234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,2,1,balanced,1.2191893259684246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,2,1,balanced,1.220293362935384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,2,1,power_law_1.01,1.0857151985168456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,2,1,power_law_1.01,1.1062399864196777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,2,1,power_law_1.2,1.1371392250061034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,2,1,power_law_1.2,1.144972801208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,32,1,balanced,0.18375466267267862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,32,1,balanced,0.1841119925181071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,32,1,power_law_1.01,0.17405439615249635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,32,1,power_law_1.01,0.17530879974365235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,32,1,power_law_1.2,0.17496960163116454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,32,1,power_law_1.2,0.17566720247268677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,4,1,balanced,0.6354399919509888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,4,1,balanced,0.6375093460083008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,4,1,power_law_1.01,0.5997824192047119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,4,1,power_law_1.01,0.605625581741333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,4,1,power_law_1.2,0.6074240207672119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,4,1,power_law_1.2,0.6104000091552735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,8,1,balanced,0.35582931836446124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,8,1,balanced,0.3567039966583252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,8,1,power_law_1.01,0.33208959102630614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,8,1,power_law_1.01,0.34149119853973386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,8,1,power_law_1.2,0.3420864105224609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,6144,2560,8,160,8,1,power_law_1.2,0.34542078971862794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,1,balanced,3.4616053899129233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,1,balanced,3.462922732035319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,1,power_law_1.01,2.89483528137207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,1,power_law_1.01,2.899897575378418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,1,power_law_1.2,2.8910400390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,1,power_law_1.2,2.9890815734863283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,128,balanced,0.17878933747609457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,128,balanced,0.17969600359598795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,128,power_law_1.01,0.17682559490203859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,128,power_law_1.01,0.1769919991493225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,128,power_law_1.2,0.1760256052017212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,128,power_law_1.2,0.17690880298614503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,16,balanced,0.3760586579640706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,16,balanced,0.37864001592000324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,16,power_law_1.01,0.3468672037124634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,16,power_law_1.01,0.3550591945648193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,16,power_law_1.2,0.3261248111724854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,16,power_law_1.2,0.3664128065109253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,2,balanced,1.8597013155619304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,2,balanced,1.893679936726888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,2,power_law_1.01,1.5554240226745606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,2,power_law_1.01,1.5826944351196288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,2,power_law_1.2,1.533132839202881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,2,power_law_1.2,1.558732795715332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,256,balanced,0.17602666219075522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,256,balanced,0.17685333887736002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,256,power_law_1.01,0.17310719490051268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,256,power_law_1.01,0.17359999418258668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,256,power_law_1.2,0.1729856014251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,256,power_law_1.2,0.17348480224609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,32,balanced,0.24067733685175577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,32,balanced,0.2408213416735331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,32,power_law_1.01,0.22963199615478516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,32,power_law_1.01,0.23308160305023193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,32,power_law_1.2,0.22371840476989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,32,power_law_1.2,0.23300480842590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,4,balanced,0.9722080230712891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,4,balanced,0.9732586542765299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,4,power_law_1.01,0.8217856407165527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,4,power_law_1.01,0.8693056106567383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,4,power_law_1.2,0.8598143577575683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,4,power_law_1.2,0.8908864021301269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,64,balanced,0.18817599614461264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,64,balanced,0.18876266479492188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,64,power_law_1.01,0.18416639566421508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,64,power_law_1.01,0.1851263999938965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,64,power_law_1.2,0.1845247983932495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,64,power_law_1.2,0.18568960428237916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,8,balanced,0.5742133458455404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,8,balanced,0.5785866578420004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,8,power_law_1.01,0.4821184158325195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,8,power_law_1.01,0.5269440174102783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,8,power_law_1.2,0.5171775817871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,1,8,power_law_1.2,0.549561595916748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,16,1,balanced,0.3729120095570882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,16,1,balanced,0.3729226589202881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,16,1,power_law_1.01,0.29361920356750487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,16,1,power_law_1.01,0.2946880102157593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,16,1,power_law_1.2,0.29424641132354734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,16,1,power_law_1.2,0.3066943883895874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,2,1,balanced,1.8233760197957356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,2,1,balanced,1.8505279223124187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,2,1,power_law_1.01,1.5118399620056153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,2,1,power_law_1.01,1.5202816009521485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,2,1,power_law_1.2,1.4952768325805663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,2,1,power_law_1.2,1.5409728050231934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,32,1,balanced,0.2547679940859477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,32,1,balanced,0.25626667340596515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,32,1,power_law_1.01,0.23474559783935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,32,1,power_law_1.01,0.23676800727844238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,32,1,power_law_1.2,0.23746559619903565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,32,1,power_law_1.2,0.2385472059249878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,4,1,balanced,0.9284959634145101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,4,1,balanced,0.9320106506347656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,4,1,power_law_1.01,0.7944511890411377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,4,1,power_law_1.01,0.7996479988098144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,4,1,power_law_1.2,0.7841792106628418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,4,1,power_law_1.2,0.7923200130462646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,8,1,balanced,0.5484373172124227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,8,1,balanced,0.5507839918136597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,8,1,power_law_1.01,0.4534656047821045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,8,1,power_law_1.01,0.4547264099121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,8,1,power_law_1.2,0.44657278060913086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,256,8,1,power_law_1.2,0.46712961196899416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,1,balanced,5.418799718221028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,1,balanced,5.555440266927083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,1,power_law_1.01,4.06822395324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,1,power_law_1.01,4.068832015991211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,1,power_law_1.2,4.0777534484863285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,1,power_law_1.2,4.163372802734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,128,balanced,0.22593067089716592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,128,balanced,0.22831465800603232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,128,power_law_1.01,0.22554240226745606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,128,power_law_1.01,0.22570879459381105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,128,power_law_1.2,0.2240895986557007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,128,power_law_1.2,0.22442240715026857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,16,balanced,0.5055253505706787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,16,balanced,0.5058826605478922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,16,power_law_1.01,0.46652798652648925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,16,power_law_1.01,0.4692863941192627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,16,power_law_1.2,0.4258431911468506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,16,power_law_1.2,0.4690688133239746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,2,balanced,2.745141347249349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,2,balanced,2.7982346216837564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,2,power_law_1.01,2.1170560836791994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,2,power_law_1.01,2.1325183868408204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,2,power_law_1.2,2.0416448593139647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,2,power_law_1.2,2.175609588623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,32,balanced,0.3468960126241048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,32,balanced,0.34832000732421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,32,power_law_1.01,0.3151808023452759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,32,power_law_1.01,0.3219327926635742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,32,power_law_1.2,0.3142143964767456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,32,power_law_1.2,0.3301568031311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,4,balanced,1.4383893013000488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,4,balanced,1.4524532953898113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,4,power_law_1.01,1.1582719802856445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,4,power_law_1.01,1.2347519874572754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,4,power_law_1.2,1.1952832221984864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,4,power_law_1.2,1.2091839790344239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,64,balanced,0.2509760061899821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,64,balanced,0.2526400089263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,64,power_law_1.01,0.24414079189300536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,64,power_law_1.01,0.24732799530029298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,64,power_law_1.2,0.24183039665222167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,64,power_law_1.2,0.24204800128936768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,8,balanced,0.8153173128763834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,8,balanced,0.8213866551717123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,8,power_law_1.01,0.6519552230834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,8,power_law_1.01,0.6974016189575195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,8,power_law_1.2,0.6935359954833984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,1,8,power_law_1.2,0.713804817199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,16,1,balanced,0.4862133264541626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,16,1,balanced,0.48908265431722003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,16,1,power_law_1.01,0.42298240661621095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,16,1,power_law_1.01,0.42684159278869627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,16,1,power_law_1.2,0.4210944175720215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,16,1,power_law_1.2,0.42281599044799806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,2,1,balanced,2.743664105733236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,2,1,balanced,2.7475999196370444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,2,1,power_law_1.01,2.0708288192749023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,2,1,power_law_1.01,2.077689552307129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,2,1,power_law_1.2,2.0167360305786133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,2,1,power_law_1.2,2.0466495513916017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,32,1,balanced,0.35046935081481934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,32,1,balanced,0.3512800137201945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,32,1,power_law_1.01,0.30417919158935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,32,1,power_law_1.01,0.30687999725341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,32,1,power_law_1.2,0.30088319778442385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,32,1,power_law_1.2,0.3010495901107788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,4,1,balanced,1.3614506721496582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,4,1,balanced,1.3823787371317546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,4,1,power_law_1.01,1.082329559326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,4,1,power_law_1.01,1.094438362121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,4,1,power_law_1.2,1.0671680450439454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,4,1,power_law_1.2,1.0800767898559571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,8,1,balanced,0.7779359817504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,8,1,balanced,0.7812159856160482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,8,1,power_law_1.01,0.6181759834289551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,8,1,power_law_1.01,0.6208320140838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,8,1,power_law_1.2,0.6160895824432373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,160,7168,2048,8,384,8,1,power_law_1.2,0.6191999912261963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,1,balanced,1.6393653551737468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,1,balanced,1.6711680094401042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,1,power_law_1.01,1.8010879516601563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,1,power_law_1.01,1.8174335479736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,1,power_law_1.2,1.8243648529052734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,1,power_law_1.2,1.8310976028442383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,128,balanced,0.7683573563893636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,128,balanced,0.7708799839019775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,128,power_law_1.01,0.859398365020752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,128,power_law_1.01,0.8657600402832031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,128,power_law_1.2,0.9105471611022949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,128,power_law_1.2,0.9196224212646484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,16,balanced,0.8421066602071127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,16,balanced,0.8439520200093588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,16,power_law_1.01,0.9518976211547852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,16,power_law_1.01,0.9777728080749511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,16,power_law_1.2,1.036633586883545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,16,power_law_1.2,1.0736576080322267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,2,balanced,1.4299519856770833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,2,balanced,1.4333972930908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,2,power_law_1.01,1.5049344062805177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,2,power_law_1.01,1.5679167747497558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,2,power_law_1.2,1.5297727584838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,2,power_law_1.2,1.6224447250366212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,32,balanced,0.7996160189310709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,32,balanced,0.8047146797180176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,32,power_law_1.01,0.9095423698425293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,32,power_law_1.01,0.9141823768615722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,32,power_law_1.2,0.9355456352233886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,32,power_law_1.2,0.9357376098632812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,4,balanced,1.095018704732259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,4,balanced,1.0961439609527588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,4,power_law_1.01,1.1909184455871582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,4,power_law_1.01,1.1987903594970704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,4,power_law_1.2,1.264236831665039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,4,power_law_1.2,1.2992192268371583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,64,balanced,0.7808266480763754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,64,balanced,0.7821173667907715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,64,power_law_1.01,0.8667327880859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,64,power_law_1.01,0.8702655792236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,64,power_law_1.2,0.9216896057128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,64,power_law_1.2,0.9368255615234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,8,balanced,0.9279200236002604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,8,balanced,0.9285013675689697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,8,power_law_1.01,1.022758388519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,8,power_law_1.01,1.1131072044372559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,8,power_law_1.2,1.1310144424438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,1,8,power_law_1.2,1.1379263877868653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,2,1,balanced,1.247989336649577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,2,1,balanced,1.2567839622497559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,2,1,power_law_1.01,1.3253888130187987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,2,1,power_law_1.01,1.3263744354248046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,2,1,power_law_1.2,1.3282879829406737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,2,1,power_law_1.2,1.3340352058410645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,4,1,balanced,0.9382293224334717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,4,1,balanced,0.9467679659525553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,4,1,power_law_1.01,0.9853311538696289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,4,1,power_law_1.01,0.9853568077087402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,4,1,power_law_1.2,0.9859456062316895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2048,768,8,128,4,1,power_law_1.2,0.9886528015136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,1,balanced,3.750917434692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,1,balanced,3.769909222920736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,1,power_law_1.01,3.9966720581054687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,1,power_law_1.01,4.0729728698730465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,1,power_law_1.2,4.008422470092773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,1,power_law_1.2,4.023519897460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,128,balanced,1.003328005472819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,128,balanced,1.0056053002675374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,128,power_law_1.01,1.1607999801635742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,128,power_law_1.01,1.1626175880432128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,128,power_law_1.2,1.3611007690429688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,128,power_law_1.2,1.3812352180480958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,16,balanced,1.1659306685129802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,16,balanced,1.1670133272806804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,16,power_law_1.01,1.3854016304016112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,16,power_law_1.01,1.4120512008666992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,16,power_law_1.2,1.5272255897521974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,16,power_law_1.2,1.620319938659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,2,balanced,2.5002026557922363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,2,balanced,2.510325272878011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,2,power_law_1.01,2.6791360855102537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,2,power_law_1.01,2.853446388244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,2,power_law_1.2,2.807027244567871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,2,power_law_1.2,2.9214336395263674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,32,balanced,1.0725066661834717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,32,balanced,1.073573350906372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,32,power_law_1.01,1.2431551933288574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,32,power_law_1.01,1.3091903686523438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,32,power_law_1.2,1.448953628540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,32,power_law_1.2,1.5453951835632325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,4,balanced,1.7386080423990886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,4,balanced,1.7388052940368652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,4,power_law_1.01,1.9236799240112306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,4,power_law_1.01,2.013324737548828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,4,power_law_1.2,2.0716991424560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,4,power_law_1.2,2.0817407608032226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,64,balanced,1.026863972345988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,64,balanced,1.0275999704996746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,64,power_law_1.01,1.201516819000244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,64,power_law_1.01,1.2277440071105956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,64,power_law_1.2,1.300492763519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,64,power_law_1.2,1.4364352226257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,8,balanced,1.355024019877116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,8,balanced,1.3550772666931152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,8,power_law_1.01,1.581721591949463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,8,power_law_1.01,1.6803903579711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,8,power_law_1.2,1.7055679321289063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,1,8,power_law_1.2,1.8314048767089843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,16,1,balanced,1.7534559567769368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,16,1,balanced,1.7560319900512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,16,1,power_law_1.01,1.8801151275634767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,16,1,power_law_1.01,1.8816703796386718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,16,1,power_law_1.2,1.9008127212524415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,16,1,power_law_1.2,1.9009151458740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,2,1,balanced,2.325295925140381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,2,1,balanced,2.3457066218058267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,2,1,power_law_1.01,2.426963233947754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,2,1,power_law_1.01,2.456812858581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,2,1,power_law_1.2,2.4166015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,2,1,power_law_1.2,2.4329471588134766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,32,1,balanced,1.461114724477132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,32,1,balanced,1.4643893241882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,32,1,power_law_1.01,1.551583957672119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,32,1,power_law_1.01,1.5530943870544434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,32,1,power_law_1.2,1.5638719558715821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,32,1,power_law_1.2,1.5673855781555175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,4,1,balanced,1.4860320091247559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,4,1,balanced,1.492186705271403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,4,1,power_law_1.01,1.5843520164489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,4,1,power_law_1.01,1.591808032989502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,4,1,power_law_1.2,1.5992447853088378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,4,1,power_law_1.2,1.6002111434936523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,8,1,balanced,2.1949332555135093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,8,1,balanced,2.195770740509033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,8,1,power_law_1.01,2.3577600479125977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,8,1,power_law_1.01,2.358451271057129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,8,1,power_law_1.2,2.3755327224731446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,2688,1856,6,128,8,1,power_law_1.2,2.3760576248168945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,1,balanced,5.407328287760417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,1,balanced,5.5225067138671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,1,power_law_1.01,5.740876770019531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,1,power_law_1.01,6.041388702392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,1,power_law_1.2,5.628607940673828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,1,power_law_1.2,5.878303909301758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,128,balanced,1.1894933382670085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,128,balanced,1.1915946801503499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,128,power_law_1.01,1.3278783798217773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,128,power_law_1.01,1.3361727714538574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,128,power_law_1.2,1.4572928428649903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,128,power_law_1.2,1.4828543663024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,16,balanced,1.4067625999450684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,16,balanced,1.4098827044169109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,16,power_law_1.01,1.578713607788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,16,power_law_1.01,1.6178112030029297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,16,power_law_1.2,1.756051254272461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,16,power_law_1.2,1.7872575759887694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,2,balanced,3.2968266805013022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,2,balanced,3.372463862101237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,2,power_law_1.01,3.4554622650146483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,2,power_law_1.01,3.505779266357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,2,power_law_1.2,3.5950847625732423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,2,power_law_1.2,3.8232448577880858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,256,balanced,1.1739253203074138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,256,balanced,1.173967997233073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,256,power_law_1.01,1.2865344047546388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,256,power_law_1.01,1.2924863815307617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,256,power_law_1.2,1.418937587738037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,256,power_law_1.2,1.4669247627258302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,32,balanced,1.2803893089294434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,32,balanced,1.286959966023763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,32,power_law_1.01,1.4886464118957519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,32,power_law_1.01,1.5022208213806152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,32,power_law_1.2,1.5557503700256348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,32,power_law_1.2,1.643289566040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,4,balanced,2.167616049448649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,4,balanced,2.1858293215433755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,4,power_law_1.01,2.5806528091430665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,4,power_law_1.01,2.617964744567871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,4,power_law_1.2,2.5718719482421877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,4,power_law_1.2,2.606483268737793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,64,balanced,1.2193546295166016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,64,balanced,1.2206026713053386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,64,power_law_1.01,1.3751551628112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,64,power_law_1.01,1.398265552520752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,64,power_law_1.2,1.512384033203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,64,power_law_1.2,1.5958720207214356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,8,balanced,1.6597386995951335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,8,balanced,1.6631520589192708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,8,power_law_1.01,1.8628927230834962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,8,power_law_1.01,1.9326463699340821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,8,power_law_1.2,1.9743423461914062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,1,8,power_law_1.2,1.9859584808349608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,16,1,balanced,1.163647969563802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,16,1,balanced,1.166431983311971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,16,1,power_law_1.01,1.2544832229614258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,16,1,power_law_1.01,1.2578432083129882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,16,1,power_law_1.2,1.271718406677246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,16,1,power_law_1.2,1.2742464065551757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,2,1,balanced,2.898757298787435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,2,1,balanced,3.154714584350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,2,1,power_law_1.01,3.1711807250976562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,2,1,power_law_1.01,3.205414581298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,2,1,power_law_1.2,3.2727935791015623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,2,1,power_law_1.2,3.293920135498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,32,1,balanced,1.001845359802246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,32,1,balanced,1.0037706693013508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,32,1,power_law_1.01,1.074892807006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,32,1,power_law_1.01,1.074988842010498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,32,1,power_law_1.2,1.0843263626098634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,32,1,power_law_1.2,1.0855615615844727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,4,1,balanced,1.8538719813028972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,4,1,balanced,1.8558826446533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,4,1,power_law_1.01,1.9970815658569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,4,1,power_law_1.01,2.0070528030395507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,4,1,power_law_1.2,2.018079948425293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,4,1,power_law_1.2,2.0388736724853516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,8,1,balanced,1.3694559733072917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,8,1,balanced,1.3716799418131511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,8,1,power_law_1.01,1.4564288139343262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,8,1,power_law_1.01,1.4571968078613282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,8,1,power_law_1.2,1.4701312065124512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,3072,1536,8,256,8,1,power_law_1.2,1.4805631637573242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,1,balanced,15.416107177734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,1,balanced,15.547770182291666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,1,power_law_1.01,14.872230529785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,1,power_law_1.01,15.03148193359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,1,power_law_1.2,14.95911102294922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,1,power_law_1.2,15.115084838867187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,2,balanced,8.18508783976237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,2,balanced,8.226325352986654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,2,power_law_1.01,11.309158325195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,2,power_law_1.01,12.985658264160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,2,power_law_1.2,10.046604919433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,2,power_law_1.2,10.318956756591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,4,balanced,4.724965413411458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,4,balanced,4.742789268493652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,4,power_law_1.01,11.020230102539063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,4,power_law_1.01,8.358758544921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,4,power_law_1.2,8.264633941650391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,4,power_law_1.2,8.538285064697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,8,balanced,3.1280107498168945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,8,balanced,3.151935895284017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,8,power_law_1.01,7.562649536132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,8,power_law_1.01,7.6023101806640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,8,power_law_1.2,8.013504028320312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,1,8,power_law_1.2,8.198585510253906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,16,1,balanced,0.985765298207601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,16,1,balanced,0.9893759886423746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,16,1,power_law_1.01,1.0057920455932616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,16,1,power_law_1.01,1.0220864295959473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,16,1,power_law_1.2,1.0113535881042481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,16,1,power_law_1.2,1.0194368362426758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,2,1,balanced,6.841061274210612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,2,1,balanced,6.9873708089192705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,2,1,power_law_1.01,7.049638366699218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,2,1,power_law_1.01,7.123149108886719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,2,1,power_law_1.2,6.828230285644532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,2,1,power_law_1.2,6.884825897216797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,32,1,balanced,0.6631679932276408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,32,1,balanced,0.6667946974436442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,32,1,power_law_1.01,0.6765759944915771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,32,1,power_law_1.01,0.6791999816894532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,32,1,power_law_1.2,0.6791615962982178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,32,1,power_law_1.2,0.6802112102508545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,4,1,balanced,3.276538530985514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,4,1,balanced,3.444416046142578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,4,1,power_law_1.01,3.2293121337890627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,4,1,power_law_1.01,3.247590255737305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,4,1,power_law_1.2,3.2396160125732423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,4,1,power_law_1.2,3.243500900268555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,8,1,balanced,1.7019519805908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,8,1,balanced,1.7107680638631184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,8,1,power_law_1.01,1.7154111862182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,8,1,power_law_1.01,1.734329605102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,8,1,power_law_1.2,1.7421503067016602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,14336,2,8,8,1,power_law_1.2,1.7451904296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,1,balanced,6.477333068847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,1,balanced,6.516986846923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,1,power_law_1.01,6.8421180725097654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,1,power_law_1.01,6.922873687744141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,1,power_law_1.2,6.540799713134765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,1,power_law_1.2,6.792684936523438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,128,balanced,1.3539519309997559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,128,balanced,1.3545653025309246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,128,power_law_1.01,1.6222911834716798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,128,power_law_1.01,1.6552640914916992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,128,power_law_1.2,1.8651199340820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,128,power_law_1.2,1.871558380126953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,16,balanced,1.6220746040344238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,16,balanced,1.6236426035563152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,16,power_law_1.01,2.089958381652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,16,power_law_1.01,2.0954687118530275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,16,power_law_1.2,2.2208831787109373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,16,power_law_1.2,2.2248064041137696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,2,balanced,3.8934240341186523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,2,balanced,3.96450138092041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,2,power_law_1.01,4.24705924987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,2,power_law_1.01,4.250873565673828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,2,power_law_1.2,4.329216003417969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,2,power_law_1.2,4.6889087677001955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,32,balanced,1.465877374013265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,32,balanced,1.4694347381591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,32,power_law_1.01,1.824025535583496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,32,power_law_1.01,1.8580608367919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,32,power_law_1.2,2.066559982299805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,32,power_law_1.2,2.1076032638549806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,4,balanced,2.5529866218566895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,4,balanced,2.5570027033487954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,4,power_law_1.01,3.0781248092651365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,4,power_law_1.01,3.2320831298828123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,4,power_law_1.2,3.171238327026367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,4,power_law_1.2,3.3759361267089845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,64,balanced,1.3927146593729656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,64,balanced,1.3975946108500164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,64,power_law_1.01,1.7166719436645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,64,power_law_1.01,1.7346815109252929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,64,power_law_1.2,1.8656959533691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,64,power_law_1.2,2.0382720947265627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,8,balanced,1.9308586120605469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,8,balanced,1.9322400093078613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,8,power_law_1.01,2.2851583480834963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,8,power_law_1.01,2.35677433013916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,8,power_law_1.2,2.526265525817871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,1,8,power_law_1.2,2.5604223251342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,16,1,balanced,1.4518826802571614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,16,1,balanced,1.4545599619547527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,16,1,power_law_1.01,1.5315520286560058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,16,1,power_law_1.01,1.5348992347717285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,16,1,power_law_1.2,1.5406528472900392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,16,1,power_law_1.2,1.5418432235717774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,2,1,balanced,3.0593652725219727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,2,1,balanced,3.0667041142781577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,2,1,power_law_1.01,3.2196990966796877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,2,1,power_law_1.01,3.330495834350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,2,1,power_law_1.2,3.239481735229492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,2,1,power_law_1.2,3.335488128662109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,32,1,balanced,1.2468266487121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,32,1,balanced,1.2476426760355632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,32,1,power_law_1.01,1.303328037261963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,32,1,power_law_1.01,1.3035840034484862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,32,1,power_law_1.2,1.3098176002502442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,32,1,power_law_1.2,1.315884780883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,4,1,balanced,2.255727926890055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,4,1,balanced,2.2727306683858237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,4,1,power_law_1.01,2.395699119567871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,4,1,power_law_1.01,2.414918327331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,4,1,power_law_1.2,2.402547264099121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,4,1,power_law_1.2,2.40578556060791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,8,1,balanced,1.6851305961608887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,8,1,balanced,1.691263993581136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,8,1,power_law_1.01,1.768351936340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,8,1,power_law_1.01,1.7697792053222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,8,1,power_law_1.2,1.7765567779541016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,1536,8,128,8,1,power_law_1.2,1.778099250793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,1,balanced,37.61187235514323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,1,balanced,37.61830393473307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,1,power_law_1.01,34.57859802246094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,1,power_law_1.01,35.022509765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,1,power_law_1.2,35.4528564453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,1,power_law_1.2,36.3662841796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,128,balanced,4.934090614318848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,128,balanced,4.940410614013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,128,power_law_1.01,5.484070587158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,128,power_law_1.01,5.528646469116211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,128,power_law_1.2,5.977536010742187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,128,power_law_1.2,6.018572616577148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,16,balanced,6.475034713745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,16,balanced,6.489909489949544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,16,power_law_1.01,7.1225532531738285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,16,power_law_1.01,7.480281829833984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,16,power_law_1.2,7.951116943359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,16,power_law_1.2,8.3531005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,2,balanced,21.516751607259113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,2,balanced,22.10741424560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,2,power_law_1.01,20.14600372314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,2,power_law_1.01,21.068179321289062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,2,power_law_1.2,21.82953643798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,2,power_law_1.2,22.6221435546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,256,balanced,4.81657059987386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,256,balanced,4.8261919021606445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,256,power_law_1.01,5.318745422363281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,256,power_law_1.01,5.36487045288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,256,power_law_1.2,5.738681411743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,256,power_law_1.2,5.85849609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,32,balanced,5.583765029907227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,32,balanced,5.59329096476237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,32,power_law_1.01,6.466194915771484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,32,power_law_1.01,6.548838043212891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,32,power_law_1.2,6.91673583984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,32,power_law_1.2,7.335052490234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,4,balanced,12.3176638285319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,4,balanced,12.704176584879557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,4,power_law_1.01,13.096141052246093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,4,power_law_1.01,13.777638244628907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,4,power_law_1.2,13.630149841308594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,4,power_law_1.2,14.24388427734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,64,balanced,5.155690511067708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,64,balanced,5.15671984354655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,64,power_law_1.01,5.741811370849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,64,power_law_1.01,5.8813823699951175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,64,power_law_1.2,6.2833984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,64,power_law_1.2,6.385561752319336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,8,balanced,8.249850591023764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,8,balanced,8.275360107421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,8,power_law_1.01,9.027954864501954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,8,power_law_1.01,9.570880126953124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,8,power_law_1.2,10.233869171142578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,1,8,power_law_1.2,9.346720123291016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,16,1,balanced,10.425429026285807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,16,1,balanced,10.429573059082031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,16,1,power_law_1.01,10.60830078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,16,1,power_law_1.01,10.616236877441406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,16,1,power_law_1.2,10.666643524169922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,16,1,power_law_1.2,10.686431884765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,2,1,balanced,16.688133239746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,2,1,balanced,17.38969548543294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,2,1,power_law_1.01,16.674656677246094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,2,1,power_law_1.01,17.230892944335938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,2,1,power_law_1.2,16.949055480957032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,2,1,power_law_1.2,16.994528198242186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,32,1,balanced,9.192453384399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,32,1,balanced,9.206975936889648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,32,1,power_law_1.01,9.310374450683593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,32,1,power_law_1.01,9.33004150390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,32,1,power_law_1.2,9.423334503173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,32,1,power_law_1.2,9.428717041015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,4,1,balanced,33.17146555582682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,4,1,balanced,33.2688954671224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,4,1,power_law_1.01,33.3640380859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,4,1,power_law_1.01,33.557073974609374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,4,1,power_law_1.2,33.18160705566406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,4,1,power_law_1.2,33.33994750976562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,8,1,balanced,7.00059191385905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,8,1,balanced,7.05668830871582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,8,1,power_law_1.01,6.878380584716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,8,1,power_law_1.01,6.945753479003907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,8,1,power_law_1.2,6.776480102539063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,4096,2688,22,512,8,1,power_law_1.2,6.934719848632812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,1,balanced,25.874593098958332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,1,balanced,26.748921712239582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,1,power_law_1.01,24.9706298828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,1,power_law_1.01,25.256346130371092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,1,power_law_1.2,24.99897003173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,1,power_law_1.2,25.210169982910156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,2,balanced,12.893882751464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,2,balanced,13.834453582763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,2,power_law_1.01,20.290374755859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,2,power_law_1.01,23.12230987548828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,2,power_law_1.2,17.908601379394533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,2,power_law_1.2,18.236653137207032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,4,balanced,7.42255973815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,4,balanced,7.589557647705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,4,power_law_1.01,12.861772155761718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,4,power_law_1.01,14.258309936523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,4,power_law_1.2,12.973619079589843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,4,power_law_1.2,16.33994903564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,8,balanced,4.485146522521973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,8,balanced,4.583919843037923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,8,power_law_1.01,12.542861175537109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,8,power_law_1.01,13.21829833984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,8,power_law_1.2,13.014495849609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,1,8,power_law_1.2,13.154182434082031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,16,1,balanced,1.5946666399637859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,16,1,balanced,1.6290027300516765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,16,1,power_law_1.01,1.6336000442504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,16,1,power_law_1.01,1.6387136459350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,16,1,power_law_1.2,1.6220287322998046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,16,1,power_law_1.2,1.6359872817993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,2,1,balanced,11.873274485270182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,2,1,balanced,12.09170659383138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,2,1,power_law_1.01,11.891404724121093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,2,1,power_law_1.01,12.121810913085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,2,1,power_law_1.2,12.002617645263673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,2,1,power_law_1.2,12.046431732177734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,32,1,balanced,1.0107733408610027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,32,1,balanced,1.0149919986724854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,32,1,power_law_1.01,1.0364352226257325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,32,1,power_law_1.01,1.0470463752746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,32,1,power_law_1.2,1.0428288459777832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,32,1,power_law_1.2,1.0584320068359374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,4,1,balanced,5.641045252482097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,4,1,balanced,5.673381169637044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,4,1,power_law_1.01,5.5709888458251955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,4,1,power_law_1.01,5.585305786132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,4,1,power_law_1.2,5.5996543884277346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,4,1,power_law_1.2,5.6212158203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,8,1,balanced,2.9550612767537436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,8,1,balanced,3.000800132751465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,8,1,power_law_1.01,2.836684799194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,8,1,power_law_1.01,2.8808576583862306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,8,1,power_law_1.2,2.8443647384643556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,16384,2,8,8,1,power_law_1.2,2.8929344177246095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,1,balanced,13.715775807698568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,1,balanced,14.136853535970053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,1,power_law_1.01,15.155020141601563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,1,power_law_1.01,15.197415161132813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,1,power_law_1.2,14.71619873046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,1,power_law_1.2,15.373849487304687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,128,balanced,1.9690933227539062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,128,balanced,1.9737812678019206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,128,power_law_1.01,2.317856025695801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,128,power_law_1.01,2.370470428466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,128,power_law_1.2,2.6258047103881834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,128,power_law_1.2,2.666592025756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,16,balanced,2.544725259145101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,16,balanced,2.558010737101237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,16,power_law_1.01,3.3145984649658202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,16,power_law_1.01,3.3505279541015627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,16,power_law_1.2,3.5035518646240233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,16,power_law_1.2,3.6134078979492186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,2,balanced,7.880570729573567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,2,balanced,7.9458878835042315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,2,power_law_1.01,8.694668579101563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,2,power_law_1.01,8.827308654785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,2,power_law_1.2,9.093068695068359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,2,power_law_1.2,9.547532653808593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,256,balanced,1.9327999750773113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,256,balanced,1.940933386484782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,256,power_law_1.01,2.2171648025512694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,256,power_law_1.01,2.227168083190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,256,power_law_1.2,2.581337547302246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,256,power_law_1.2,2.7175615310668944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,32,balanced,2.208453337351481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,32,balanced,2.208698590596517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,32,power_law_1.01,2.7257408142089843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,32,power_law_1.01,2.769664001464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,32,power_law_1.2,3.0034303665161133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,32,power_law_1.2,3.1656896591186525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,4,balanced,4.705103874206543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,4,balanced,4.791802724202474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,4,power_law_1.01,5.504851150512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,4,power_law_1.01,6.182259368896484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,4,power_law_1.2,5.910572814941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,4,power_law_1.2,6.409394836425781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,64,balanced,2.0561653772989907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,64,balanced,2.059541384379069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,64,power_law_1.01,2.44586238861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,64,power_law_1.01,2.474905586242676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,64,power_law_1.2,2.971897506713867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,64,power_law_1.2,2.990969657897949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,8,balanced,3.24016539255778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,8,balanced,3.2517385482788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,8,power_law_1.01,3.7740928649902346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,8,power_law_1.01,3.818431854248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,8,power_law_1.2,4.419571304321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,1,8,power_law_1.2,4.448729705810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,16,1,balanced,2.14410130182902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,16,1,balanced,2.1451147397359214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,16,1,power_law_1.01,2.2879743576049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,16,1,power_law_1.01,2.294771194458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,16,1,power_law_1.2,2.3185407638549806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,16,1,power_law_1.2,2.3190656661987306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,2,1,balanced,6.97979736328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,2,1,balanced,7.1873016357421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,2,1,power_law_1.01,7.685523223876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,2,1,power_law_1.01,7.739250946044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,2,1,power_law_1.2,7.9960578918457035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,2,1,power_law_1.2,8.09359359741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,32,1,balanced,1.8298826217651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,32,1,balanced,1.8307305971781414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,32,1,power_law_1.01,1.9517951965332032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,32,1,power_law_1.01,1.9552320480346679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,32,1,power_law_1.2,1.972902488708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,32,1,power_law_1.2,1.976473617553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,4,1,balanced,4.003978729248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,4,1,balanced,4.318160057067871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,4,1,power_law_1.01,4.51341438293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,4,1,power_law_1.01,4.525907135009765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,4,1,power_law_1.2,4.562195205688477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,4,1,power_law_1.2,4.5943550109863285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,8,1,balanced,2.787306785583496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,8,1,balanced,2.8056586583455405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,8,1,power_law_1.01,2.9710975646972657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,8,1,power_law_1.01,2.9895551681518553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,8,1,power_law_1.2,3.0170495986938475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2048,8,256,8,1,power_law_1.2,3.034752082824707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,1,balanced,17.581204732259113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,1,balanced,17.639787038167317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,1,power_law_1.01,17.160231018066405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,1,power_law_1.01,17.323423767089842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,1,power_law_1.2,16.945158386230467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,1,power_law_1.2,17.424345397949217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,16,balanced,2.866522789001465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,16,balanced,2.8855412801106772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,16,power_law_1.01,3.674585723876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,16,power_law_1.01,3.957408142089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,16,power_law_1.2,4.158284759521484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,16,power_law_1.2,4.4183296203613285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,2,balanced,9.680330912272135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,2,balanced,9.790858586629232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,2,power_law_1.01,10.145798492431641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,2,power_law_1.01,11.160902404785157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,2,power_law_1.2,10.541734313964843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,2,power_law_1.2,10.683103942871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,32,balanced,2.439194679260254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,32,balanced,2.4416799545288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,32,power_law_1.01,3.1770303726196287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,32,power_law_1.01,3.416864013671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,32,power_law_1.2,3.685023880004883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,32,power_law_1.2,4.007948684692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,4,balanced,5.667695999145508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,4,balanced,5.857776006062825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,4,power_law_1.01,6.545222473144531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,4,power_law_1.01,7.252448272705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,4,power_law_1.2,6.548134613037109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,4,power_law_1.2,7.1759490966796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,8,balanced,3.7700106302897134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,8,balanced,3.770602544148763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,8,power_law_1.01,4.641177749633789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,8,power_law_1.01,4.70832633972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,8,power_law_1.2,5.617881774902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,1,8,power_law_1.2,5.655456161499023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,16,1,balanced,2.5180320739746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,16,1,balanced,2.5225226084391275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,16,1,power_law_1.01,2.539737510681152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,16,1,power_law_1.01,2.545043182373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,16,1,power_law_1.2,2.552627182006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,16,1,power_law_1.2,2.552672004699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,2,1,balanced,9.010992050170898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,2,1,balanced,9.21997324625651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,2,1,power_law_1.01,8.7176513671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,2,1,power_law_1.01,8.922061157226562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,2,1,power_law_1.2,8.72723846435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,2,1,power_law_1.2,9.061580657958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,32,1,balanced,2.175898710886637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,32,1,balanced,2.176976044972738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,32,1,power_law_1.01,2.188140869140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,32,1,power_law_1.01,2.1937536239624023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,32,1,power_law_1.2,2.207731246948242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,32,1,power_law_1.2,2.2078847885131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,4,1,balanced,5.08460267384847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,4,1,balanced,5.103631973266602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,4,1,power_law_1.01,5.0771137237548825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,4,1,power_law_1.01,5.143667221069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,4,1,power_law_1.2,5.025779342651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,4,1,power_law_1.2,5.049766540527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,8,1,balanced,3.1609973907470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,8,1,balanced,3.21669864654541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,8,1,power_law_1.01,3.1939456939697264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,8,1,power_law_1.01,3.2168960571289062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,8,1,power_law_1.2,3.1832447052001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,6144,2560,8,160,8,1,power_law_1.2,3.2105281829833983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,1,balanced,15.808298746744791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,1,balanced,16.219343821207683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,1,power_law_1.01,17.384518432617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,1,power_law_1.01,17.71474609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,1,power_law_1.2,17.60963134765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,1,power_law_1.2,18.061599731445312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,128,balanced,2.1749919255574546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,128,balanced,2.178277333577474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,128,power_law_1.01,2.62225284576416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,128,power_law_1.01,2.6242624282836915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,128,power_law_1.2,3.1025983810424806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,128,power_law_1.2,3.1117759704589845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,16,balanced,2.8551413218180337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,16,balanced,2.8633705774943032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,16,power_law_1.01,3.562451171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,16,power_law_1.01,3.6312511444091795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,16,power_law_1.2,4.047308731079101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,16,power_law_1.2,4.194432067871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,2,balanced,9.020495732625326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,2,balanced,9.213333129882812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,2,power_law_1.01,10.312274932861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,2,power_law_1.01,10.438912200927735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,2,power_law_1.2,10.726048278808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,2,power_law_1.2,10.727571105957031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,256,balanced,2.1319360733032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,256,balanced,2.1427787144978843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,256,power_law_1.01,2.4687616348266603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,256,power_law_1.01,2.4996927261352537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,256,power_law_1.2,3.056243133544922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,256,power_law_1.2,3.0851648330688475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,32,balanced,2.4551679293314614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,32,balanced,2.458357334136963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,32,power_law_1.01,3.132614326477051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,32,power_law_1.01,3.2416126251220705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,32,power_law_1.2,3.5212032318115236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,32,power_law_1.2,3.6831615447998045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,4,balanced,5.259418805440267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,4,balanced,5.400149027506511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,4,power_law_1.01,6.4714813232421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,4,power_law_1.01,6.492633819580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,4,power_law_1.2,6.994182586669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,4,power_law_1.2,7.144441223144531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,64,balanced,2.27073605855306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,64,balanced,2.2796427408854165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,64,power_law_1.01,2.7461503982543944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,64,power_law_1.01,2.931007957458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,64,power_law_1.2,3.1769535064697267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,64,power_law_1.2,3.241516876220703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,8,balanced,3.6331679026285806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,8,balanced,3.661967913309733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,8,power_law_1.01,4.45904655456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,8,power_law_1.01,4.747846221923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,8,power_law_1.2,4.853952026367187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,1,8,power_law_1.2,5.390195083618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,16,1,balanced,2.4661547342936196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,16,1,balanced,2.4776426951090493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,16,1,power_law_1.01,2.637446403503418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,16,1,power_law_1.01,2.64005126953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,16,1,power_law_1.2,2.664659118652344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,16,1,power_law_1.2,2.67127685546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,2,1,balanced,8.127077102661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,2,1,balanced,8.420527776082357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,2,1,power_law_1.01,9.063430023193359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,2,1,power_law_1.01,9.154803466796874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,2,1,power_law_1.2,9.12147216796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,2,1,power_law_1.2,9.526950073242187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,32,1,balanced,2.105290730794271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,32,1,balanced,2.1066187222798667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,32,1,power_law_1.01,2.2403327941894533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,32,1,power_law_1.01,2.2490495681762694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,32,1,power_law_1.2,2.2608320236206056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,32,1,power_law_1.2,2.2680896759033202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,4,1,balanced,4.894010543823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,4,1,balanced,5.059856096903483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,4,1,power_law_1.01,5.267974472045898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,4,1,power_law_1.01,5.322316741943359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,4,1,power_law_1.2,5.171660614013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,4,1,power_law_1.2,5.279679870605468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,8,1,balanced,3.254138628641764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,8,1,balanced,3.257882754007975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,8,1,power_law_1.01,3.46033935546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,8,1,power_law_1.01,3.5019199371337892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,8,1,power_law_1.2,3.4722305297851563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,256,8,1,power_law_1.2,3.4865345001220702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,1,balanced,17.751968383789062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,1,balanced,19.113141377766926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,1,power_law_1.01,19.54979248046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,1,power_law_1.01,19.83461151123047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,1,power_law_1.2,19.81769561767578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,1,power_law_1.2,19.995033264160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,128,balanced,2.2503466606140137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,128,balanced,2.2505173683166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,128,power_law_1.01,2.5843711853027345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,128,power_law_1.01,2.588755226135254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,128,power_law_1.2,2.886886405944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,128,power_law_1.2,2.9781375885009767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,16,balanced,3.0192693074544272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,16,balanced,3.030186653137207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,16,power_law_1.01,3.587865447998047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,16,power_law_1.01,3.628851318359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,16,power_law_1.2,4.043609619140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,16,power_law_1.2,4.113619232177735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,2,balanced,10.270544052124023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,2,balanced,10.487157185872396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,2,power_law_1.01,11.078662109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,2,power_law_1.01,11.691737365722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,2,power_law_1.2,11.517766571044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,2,power_law_1.2,12.091558074951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,32,balanced,2.5743786493937173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,32,balanced,2.5893759727478027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,32,power_law_1.01,2.9823360443115234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,32,power_law_1.01,3.0306751251220705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,32,power_law_1.2,3.2829952239990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,32,power_law_1.2,3.4916030883789064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,4,balanced,5.887770970662435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,4,balanced,5.907941182454427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,4,power_law_1.01,6.5028541564941404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,4,power_law_1.01,6.7359870910644535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,4,power_law_1.2,6.996281433105469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,4,power_law_1.2,7.899942779541016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,64,balanced,2.356346607208252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,64,balanced,2.358799934387207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,64,power_law_1.01,2.77891845703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,64,power_law_1.01,2.8235647201538088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,64,power_law_1.2,2.979948806762695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,64,power_law_1.2,3.089030456542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,8,balanced,3.9326346715291343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,8,balanced,3.9629440307617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,8,power_law_1.01,4.446783828735351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,8,power_law_1.01,4.565977478027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,8,power_law_1.2,5.0908863067626955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,1,8,power_law_1.2,5.4559680938720705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,16,1,balanced,2.7175413767496743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,16,1,balanced,2.727866808573405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,16,1,power_law_1.01,2.7907455444335936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,16,1,power_law_1.01,2.7991424560546876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,16,1,power_law_1.2,2.8337087631225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,16,1,power_law_1.2,2.8345920562744142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,2,1,balanced,9.499930699666342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,2,1,balanced,9.59495480855306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,2,1,power_law_1.01,10.156985473632812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,2,1,power_law_1.01,9.841458892822265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,2,1,power_law_1.2,10.235148620605468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,2,1,power_law_1.2,10.570015716552735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,32,1,balanced,2.2431413332621255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,32,1,balanced,2.243951956431071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,32,1,power_law_1.01,2.356710433959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,32,1,power_law_1.01,2.3606719970703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,32,1,power_law_1.2,2.382067108154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,32,1,power_law_1.2,2.3893760681152343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,4,1,balanced,5.333738962809245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,4,1,balanced,5.716784159342448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,4,1,power_law_1.01,5.729011154174804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,4,1,power_law_1.01,5.7485504150390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,4,1,power_law_1.2,5.804684829711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,4,1,power_law_1.2,5.823916625976563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,8,1,balanced,3.5397653579711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,8,1,balanced,3.5476160049438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,8,1,power_law_1.01,3.681932830810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,8,1,power_law_1.01,3.7364223480224608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,8,1,power_law_1.2,3.778335952758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,16384,7168,2048,8,384,8,1,power_law_1.2,3.8356224060058595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,1,balanced,0.21042132377624512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,1,balanced,0.2120373249053955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,1,power_law_1.01,0.21810560226440429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,1,power_law_1.01,0.21976959705352783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,1,power_law_1.2,0.22144639492034912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,1,power_law_1.2,0.22203519344329833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,128,balanced,0.046485334634780884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,128,balanced,0.0469706654548645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,128,power_law_1.01,0.04527359902858734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,128,power_law_1.01,0.046419200301170346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,128,power_law_1.2,0.047731199860572816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,128,power_law_1.2,0.04795520007610321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,16,balanced,0.05602666735649109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,16,balanced,0.05690133571624756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,16,power_law_1.01,0.05305600166320801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,16,power_law_1.01,0.054527997970581055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,16,power_law_1.2,0.05493119955062866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,16,power_law_1.2,0.05559679865837097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,2,balanced,0.13747732837994894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,2,balanced,0.13872533043225607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,2,power_law_1.01,0.133241605758667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,2,power_law_1.01,0.13415039777755738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,2,power_law_1.2,0.13025280237197875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,2,power_law_1.2,0.13240959644317626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,32,balanced,0.04753066599369049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,32,balanced,0.048058668772379555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,32,power_law_1.01,0.04585599899291992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,32,power_law_1.01,0.04604800045490265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,32,power_law_1.2,0.04612480103969574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,32,power_law_1.2,0.04619520008563995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,4,balanced,0.08963200449943542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,4,balanced,0.09126933415730794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,4,power_law_1.01,0.08647680282592773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,4,power_law_1.01,0.08820480108261108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,4,power_law_1.2,0.08880640268325805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,4,power_law_1.2,0.08892800211906433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,64,balanced,0.04671466847260793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,64,balanced,0.04770133395989736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,64,power_law_1.01,0.04462080001831055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,64,power_law_1.01,0.04469119906425476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,64,power_law_1.2,0.04500479996204376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,64,power_law_1.2,0.0457152009010315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,8,balanced,0.06824000179767609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,8,balanced,0.06838933130105336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,8,power_law_1.01,0.06552960276603699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,8,power_law_1.01,0.06636160016059875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,8,power_law_1.2,0.06592000126838685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,1,8,power_law_1.2,0.06878719925880432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,2,1,balanced,0.1341866652170817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,2,1,balanced,0.13554666439692178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,2,1,power_law_1.01,0.12821120023727417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,2,1,power_law_1.01,0.12872320413589478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,2,1,power_law_1.2,0.13022079467773437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,2,1,power_law_1.2,0.13108479976654053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,4,1,balanced,0.08739733695983887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,4,1,balanced,0.08901866277058919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,4,1,power_law_1.01,0.08399360179901123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,4,1,power_law_1.01,0.08509439826011658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,4,1,power_law_1.2,0.08554880023002624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2048,768,8,128,4,1,power_law_1.2,0.0856383979320526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,1,balanced,0.5909599860509237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,1,balanced,0.5932266712188721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,1,power_law_1.01,0.5766079902648926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,1,power_law_1.01,0.5804992198944092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,1,power_law_1.2,0.5820928096771241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,1,power_law_1.2,0.5913663864135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,128,balanced,0.06422399977842967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,128,balanced,0.0644160012404124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,128,power_law_1.01,0.06225280165672302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,128,power_law_1.01,0.06264320015907288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,128,power_law_1.2,0.06282240152359009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,128,power_law_1.2,0.06344320178031922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,16,balanced,0.08401599526405334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,16,balanced,0.08476266264915466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,16,power_law_1.01,0.07995520234107971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,16,power_law_1.01,0.08199040293693542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,16,power_law_1.2,0.08157439827919007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,16,power_law_1.2,0.08282880187034607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,2,balanced,0.35870933532714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,2,balanced,0.3626399834950765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,2,power_law_1.01,0.3220479965209961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,2,power_law_1.01,0.3258239984512329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,2,power_law_1.2,0.31843199729919436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,2,power_law_1.2,0.335097599029541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,32,balanced,0.07379200061162312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,32,balanced,0.07423999905586243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,32,power_law_1.01,0.07169920206069946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,32,power_law_1.01,0.07240960001945496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,32,power_law_1.2,0.07208319902420043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,32,power_law_1.2,0.07244160175323486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,4,balanced,0.20816532770792642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,4,balanced,0.21006399393081665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,4,power_law_1.01,0.19657599925994873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,4,power_law_1.01,0.19674240350723265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,4,power_law_1.2,0.1909183979034424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,4,power_law_1.2,0.19699840545654296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,64,balanced,0.06392533580462138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,64,balanced,0.06517333288987477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,64,power_law_1.01,0.0627776026725769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,64,power_law_1.01,0.06376320123672485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,64,power_law_1.2,0.06289280056953431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,64,power_law_1.2,0.06292480230331421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,8,balanced,0.1304746667544047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,8,balanced,0.13170133034388223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,8,power_law_1.01,0.11907839775085449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,8,power_law_1.01,0.125382399559021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,8,power_law_1.2,0.12430720329284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,1,8,power_law_1.2,0.12700159549713136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,16,1,balanced,0.21997332572937012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,16,1,balanced,0.2210293412208557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,16,1,power_law_1.01,0.20448000431060792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,16,1,power_law_1.01,0.2067392110824585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,16,1,power_law_1.2,0.20685439109802245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,16,1,power_law_1.2,0.21146240234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,2,1,balanced,0.348474661509196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,2,1,balanced,0.3508853514989217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,2,1,power_law_1.01,0.32439680099487306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,2,1,power_law_1.01,0.3267008066177368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,2,1,power_law_1.2,0.32354559898376467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,2,1,power_law_1.2,0.3300352096557617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,32,1,balanced,0.18910932540893555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,32,1,balanced,0.1893493334452311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,32,1,power_law_1.01,0.17004799842834473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,32,1,power_law_1.01,0.1732416033744812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,32,1,power_law_1.2,0.17660800218582154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,32,1,power_law_1.2,0.17876479625701905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,4,1,balanced,0.20445332924524942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,4,1,balanced,0.20529067516326904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,4,1,power_law_1.01,0.19422719478607178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,4,1,power_law_1.01,0.19583359956741334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,4,1,power_law_1.2,0.1972607970237732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,4,1,power_law_1.2,0.19803520441055297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,8,1,balanced,0.32205865780512494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,8,1,balanced,0.3229440053304036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,8,1,power_law_1.01,0.2993407964706421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,8,1,power_law_1.01,0.2999295949935913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,8,1,power_law_1.2,0.3071743965148926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,2688,1856,6,128,8,1,power_law_1.2,0.31090559959411623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,1,balanced,1.1643040180206299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,1,balanced,1.1676266988118489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,1,power_law_1.01,0.9692352294921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,1,power_law_1.01,0.991539192199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,1,power_law_1.2,0.9956159591674805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,1,power_law_1.2,0.9970560073852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,128,balanced,0.09698667128880818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,128,balanced,0.09699733058611552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,128,power_law_1.01,0.09437440037727356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,128,power_law_1.01,0.09511039853096008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,128,power_law_1.2,0.09516159892082214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,128,power_law_1.2,0.0951807975769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,16,balanced,0.15423466761906943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,16,balanced,0.15601066748301187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,16,power_law_1.01,0.14357759952545165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,16,power_law_1.01,0.14398720264434814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,16,power_law_1.2,0.13834240436553955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,16,power_law_1.2,0.14165120124816893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,2,balanced,0.6165226697921753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,2,balanced,0.6204586823781332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,2,power_law_1.01,0.5451712131500244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,2,power_law_1.01,0.5476928234100342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,2,power_law_1.2,0.5252543926239014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,2,power_law_1.2,0.5386303901672364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,256,balanced,0.09697066744168599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,256,balanced,0.09702400366465251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,256,power_law_1.01,0.09463040232658386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,256,power_law_1.01,0.09474560022354125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,256,power_law_1.2,0.09498239755630493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,256,power_law_1.2,0.09516159892082214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,32,balanced,0.11053333679835002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,32,balanced,0.11307199796040852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,32,power_law_1.01,0.1078976035118103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,32,power_law_1.01,0.1095039963722229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,32,power_law_1.2,0.10705280303955078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,32,power_law_1.2,0.10840320587158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,4,balanced,0.3556319872538249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,4,balanced,0.35734399159749347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,4,power_law_1.01,0.3219007968902588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,4,power_law_1.01,0.32890241146087645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,4,power_law_1.2,0.33048961162567136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,4,power_law_1.2,0.3389055967330933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,64,balanced,0.10102933645248413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,64,balanced,0.10321066776911418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,64,power_law_1.01,0.10034559965133667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,64,power_law_1.01,0.1007807970046997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,64,power_law_1.2,0.09989759922027588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,64,power_law_1.2,0.10067839622497558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,8,balanced,0.2171199917793274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,8,balanced,0.21990400552749634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,8,power_law_1.01,0.20271360874176025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,8,power_law_1.01,0.2061311960220337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,8,power_law_1.2,0.20236799716949463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,1,8,power_law_1.2,0.20473599433898926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,16,1,balanced,0.16249600052833557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,16,1,balanced,0.16421866416931152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,16,1,power_law_1.01,0.13256959915161132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,16,1,power_law_1.01,0.13691519498825072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,16,1,power_law_1.2,0.133951997756958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,16,1,power_law_1.2,0.13605120182037353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,2,1,balanced,0.6023413340250651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,2,1,balanced,0.6031306584676107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,2,1,power_law_1.01,0.5064511775970459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,2,1,power_law_1.01,0.5181632041931152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,2,1,power_law_1.2,0.5224959850311279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,2,1,power_law_1.2,0.5270016193389893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,32,1,balanced,0.1197119951248169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,32,1,balanced,0.12128000458081563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,32,1,power_law_1.01,0.11350400447845459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,32,1,power_law_1.01,0.11448320150375366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,32,1,power_law_1.2,0.11319680213928222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,32,1,power_law_1.2,0.1137984037399292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,4,1,balanced,0.3368426561355591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,4,1,balanced,0.3377973238627116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,4,1,power_law_1.01,0.28764159679412843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,4,1,power_law_1.01,0.301689600944519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,4,1,power_law_1.2,0.2849663972854614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,4,1,power_law_1.2,0.29644160270690917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,8,1,balanced,0.20414932568868002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,8,1,balanced,0.205402672290802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,8,1,power_law_1.01,0.18795520067214966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,8,1,power_law_1.01,0.18818559646606445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,8,1,power_law_1.2,0.18629759550094604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,3072,1536,8,256,8,1,power_law_1.2,0.1883072018623352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,1,balanced,0.517136017481486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,1,balanced,0.5173706610997518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,1,power_law_1.01,0.5698368072509765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,1,power_law_1.01,0.5831679821014404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,1,power_law_1.2,0.5874688148498535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,1,power_law_1.2,0.5952000141143798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,2,balanced,0.3408426841100057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,2,balanced,0.341103990872701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,2,power_law_1.01,0.41083521842956544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,2,power_law_1.01,0.41179518699645995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,2,power_law_1.2,0.3860224008560181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,2,power_law_1.2,0.39560320377349856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,4,balanced,0.25939200321833294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,4,balanced,0.26159467299779254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,4,power_law_1.01,0.29660160541534425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,4,power_law_1.01,0.30568320751190187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,4,power_law_1.2,0.2939840078353882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,4,power_law_1.2,0.3001471996307373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,8,balanced,0.21585599581400552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,8,balanced,0.21983999013900757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,8,power_law_1.01,0.2329792022705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,8,power_law_1.01,0.2403007984161377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,8,power_law_1.2,0.23676800727844238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,1,8,power_law_1.2,0.24038400650024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,16,1,balanced,0.07634666562080383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,16,1,balanced,0.07659199833869934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,16,1,power_law_1.01,0.07775359749794006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,16,1,power_law_1.01,0.07807360291481018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,16,1,power_law_1.2,0.07669119834899903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,16,1,power_law_1.2,0.07738239765167236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,2,1,balanced,0.28597333033879596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,2,1,balanced,0.2861386736234029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,2,1,power_law_1.01,0.28549120426177976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,2,1,power_law_1.01,0.30188798904418945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,2,1,power_law_1.2,0.2898303985595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,2,1,power_law_1.2,0.30593280792236327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,32,1,balanced,0.059434667229652405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,32,1,balanced,0.0629066675901413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,32,1,power_law_1.01,0.0648959994316101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,32,1,power_law_1.01,0.06647679805755616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,32,1,power_law_1.2,0.06417919993400574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,32,1,power_law_1.2,0.0665727972984314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,4,1,balanced,0.17285333077112833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,4,1,balanced,0.1739786664644877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,4,1,power_law_1.01,0.17048319578170776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,4,1,power_law_1.01,0.17179520130157472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,4,1,power_law_1.2,0.169376003742218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,4,1,power_law_1.2,0.17423360347747802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,8,1,balanced,0.09962133566538493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,8,1,balanced,0.10134933392206828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,8,1,power_law_1.01,0.09902719855308532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,8,1,power_law_1.01,0.1004480004310608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,8,1,power_law_1.2,0.10049279928207397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,14336,2,8,8,1,power_law_1.2,0.10116480588912964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,1,balanced,0.7839146455128988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,1,balanced,0.7872373263041178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,1,power_law_1.01,0.7540031909942627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,1,power_law_1.01,0.7649983882904052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,1,power_law_1.2,0.7589951992034912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,1,power_law_1.2,0.7723199844360351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,128,balanced,0.07913599908351898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,128,balanced,0.07964266836643219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,128,power_law_1.01,0.07614719867706299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,128,power_law_1.01,0.0781440019607544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,128,power_law_1.2,0.081523197889328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,128,power_law_1.2,0.08323839902877808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,16,balanced,0.11183999975522359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,16,balanced,0.11309867103894551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,16,power_law_1.01,0.10823680162429809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,16,power_law_1.01,0.10937600135803223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,16,power_law_1.2,0.10879360437393189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,16,power_law_1.2,0.11093759536743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,2,balanced,0.4329386552174886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,2,balanced,0.4334346850713094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,2,power_law_1.01,0.41409921646118164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,2,power_law_1.01,0.4225152015686035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,2,power_law_1.2,0.4136320114135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,2,power_law_1.2,0.42984957695007325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,32,balanced,0.0974026620388031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,32,balanced,0.09790933132171631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,32,power_law_1.01,0.09658880233764648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,32,power_law_1.01,0.09746559858322143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,32,power_law_1.2,0.09794560074806213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,32,power_law_1.2,0.09831680059432983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,4,balanced,0.24819199244181314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,4,balanced,0.24964799483617148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,4,power_law_1.01,0.23716480731964112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,4,power_law_1.01,0.24464640617370606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,4,power_law_1.2,0.23550078868865967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,4,power_law_1.2,0.24579200744628907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,64,balanced,0.08957866827646892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,64,balanced,0.09091200431187947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,64,power_law_1.01,0.08767359852790832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,64,power_law_1.01,0.08965759873390197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,64,power_law_1.2,0.09052159786224365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,64,power_law_1.2,0.09063680171966552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,8,balanced,0.16038933396339417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,8,balanced,0.1607306698958079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,8,power_law_1.01,0.15393919944763185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,8,power_law_1.01,0.15479040145874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,8,power_law_1.2,0.15648000240325927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,1,8,power_law_1.2,0.1647487998008728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,16,1,balanced,0.12148267030715942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,16,1,balanced,0.12155733505884807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,16,1,power_law_1.01,0.11781760454177856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,16,1,power_law_1.01,0.1184000015258789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,16,1,power_law_1.2,0.11853439807891845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,16,1,power_law_1.2,0.11880960464477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,2,1,balanced,0.3970346848169963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,2,1,balanced,0.3992106517155965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,2,1,power_law_1.01,0.40378880500793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,2,1,power_law_1.01,0.40590081214904783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,2,1,power_law_1.2,0.4089344024658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,2,1,power_law_1.2,0.41403517723083494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,32,1,balanced,0.1049173374970754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,32,1,balanced,0.10736533006032307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,32,1,power_law_1.01,0.10241919755935669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,32,1,power_law_1.01,0.10372480154037475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,32,1,power_law_1.2,0.10422400236129761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,32,1,power_law_1.2,0.10535680055618286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,4,1,balanced,0.23730667432149252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,4,1,balanced,0.2380639910697937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,4,1,power_law_1.01,0.22834560871124268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,4,1,power_law_1.01,0.2302016019821167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,4,1,power_law_1.2,0.2286463975906372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,4,1,power_law_1.2,0.2297215938568115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,8,1,balanced,0.1516426702340444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,8,1,balanced,0.1540426711241404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,8,1,power_law_1.01,0.14585599899291993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,8,1,power_law_1.01,0.14737279415130616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,8,1,power_law_1.2,0.14743679761886597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,1536,8,128,8,1,power_law_1.2,0.14972800016403198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,1,balanced,5.420442581176758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,1,balanced,5.433743794759114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,1,power_law_1.01,4.767417526245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,1,power_law_1.01,4.875398254394531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,1,power_law_1.2,4.93493766784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,1,power_law_1.2,4.965977478027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,128,balanced,0.2914026578267415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,128,balanced,0.2921866575876872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,128,power_law_1.01,0.29003520011901857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,128,power_law_1.01,0.29113600254058836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,128,power_law_1.2,0.2903167963027954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,128,power_law_1.2,0.29034879207611086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,16,balanced,0.593994657198588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,16,balanced,0.5953066746393839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,16,power_law_1.01,0.5573503971099854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,16,power_law_1.01,0.5641280174255371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,16,power_law_1.2,0.5562560081481933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,16,power_law_1.2,0.5606016159057617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,2,balanced,2.7494239807128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,2,balanced,2.8545920054117837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,2,power_law_1.01,2.5536895751953126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,2,power_law_1.01,2.558393669128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,2,power_law_1.2,2.530067253112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,2,power_law_1.2,2.5541887283325195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,256,balanced,0.28062933683395386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,256,balanced,0.2813013394673665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,256,power_law_1.01,0.27991681098937987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,256,power_law_1.01,0.2805504083633423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,256,power_law_1.2,0.28104960918426514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,256,power_law_1.2,0.28142080307006834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,32,balanced,0.4272693395614624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,32,balanced,0.4275733232498169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,32,power_law_1.01,0.4174015998840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,32,power_law_1.01,0.41805438995361327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,32,power_law_1.2,0.41534719467163084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,32,power_law_1.2,0.41797761917114257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,4,balanced,1.512447992960612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,4,balanced,1.5132427215576172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,4,power_law_1.01,1.381382369995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,4,power_law_1.01,1.3896191596984864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,4,power_law_1.2,1.4172608375549316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,4,power_law_1.2,1.4213055610656737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,64,balanced,0.3283039927482605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,64,balanced,0.3284533421198527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,64,power_law_1.01,0.3231359958648682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,64,power_law_1.01,0.3258687973022461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,64,power_law_1.2,0.3216768026351929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,64,power_law_1.2,0.3235327959060669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,8,balanced,0.895962635676066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,8,balanced,0.8988800048828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,8,power_law_1.01,0.8482496261596679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,8,power_law_1.01,0.8508928298950196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,8,power_law_1.2,0.8435263633728027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,1,8,power_law_1.2,0.844428825378418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,16,1,balanced,1.4566292762756348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,16,1,balanced,1.4580319722493489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,16,1,power_law_1.01,1.3095616340637206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,16,1,power_law_1.01,1.3396672248840331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,16,1,power_law_1.2,1.3445887565612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,16,1,power_law_1.2,1.3509440422058105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,2,1,balanced,2.497231960296631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,2,1,balanced,2.5058080355326333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,2,1,power_law_1.01,2.2717567443847657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,2,1,power_law_1.01,2.284115219116211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,2,1,power_law_1.2,2.3816768646240236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,2,1,power_law_1.2,2.412601661682129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,32,1,balanced,1.1500799655914307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,32,1,balanced,1.1507253646850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,32,1,power_law_1.01,1.0607168197631835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,32,1,power_law_1.01,1.0621760368347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,32,1,power_law_1.2,1.072704029083252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,32,1,power_law_1.2,1.0822079658508301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,4,1,balanced,1.3988906542460124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,4,1,balanced,1.400053342183431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,4,1,power_law_1.01,1.3093695640563965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,4,1,power_law_1.01,1.3135040283203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,4,1,power_law_1.2,1.3545727729797363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,4,1,power_law_1.2,1.3682623863220216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,8,1,balanced,0.7817920049031576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,8,1,balanced,0.7867946624755859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,8,1,power_law_1.01,0.7326720237731934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,8,1,power_law_1.01,0.7386879920959473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,8,1,power_law_1.2,0.7363584041595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,4096,2688,22,512,8,1,power_law_1.2,0.7406079769134521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,1,balanced,0.804154634475708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,1,balanced,0.8042453130086263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,1,power_law_1.01,1.0704256057739259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,1,power_law_1.01,1.0745471954345702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,1,power_law_1.2,1.0165760040283203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,1,power_law_1.2,1.0443455696105957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,2,balanced,0.48636798063913983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,2,balanced,0.48640533288319904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,2,power_law_1.01,0.5681600093841552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,2,power_law_1.01,0.5854400157928467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,2,power_law_1.2,0.5373184204101562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,2,power_law_1.2,0.6191232204437256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,4,balanced,0.3404159943262736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,4,balanced,0.3413013219833374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,4,power_law_1.01,0.3935487985610962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,4,power_law_1.01,0.4123392105102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,4,power_law_1.2,0.3874176025390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,4,power_law_1.2,0.42035841941833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,8,balanced,0.26648000876108807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,8,balanced,0.26823999484380084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,8,power_law_1.01,0.3047744035720825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,8,power_law_1.01,0.308076810836792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,8,power_law_1.2,0.3067647933959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,1,8,power_law_1.2,0.3090303897857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,16,1,balanced,0.10569066802660625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,16,1,balanced,0.10691199700037639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,16,1,power_law_1.01,0.11012480258941651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,16,1,power_law_1.01,0.11182719469070435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,16,1,power_law_1.2,0.11139199733734131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,16,1,power_law_1.2,0.11196160316467285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,2,1,balanced,0.43646931648254395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,2,1,balanced,0.44088534514109295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,2,1,power_law_1.01,0.5174719810485839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,2,1,power_law_1.01,0.5183487892150879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,2,1,power_law_1.2,0.5275199890136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,2,1,power_law_1.2,0.5531328201293946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,32,1,balanced,0.09124267101287842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,32,1,balanced,0.09125333031018575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,32,1,power_law_1.01,0.09281280040740966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,32,1,power_law_1.01,0.09376000165939331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,32,1,power_law_1.2,0.09197440147399902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,32,1,power_law_1.2,0.09407359957695008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,4,1,balanced,0.2571840087572734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,4,1,balanced,0.26074665784835815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,4,1,power_law_1.01,0.2694080114364624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,4,1,power_law_1.01,0.2731328010559082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,4,1,power_law_1.2,0.2703423976898193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,4,1,power_law_1.2,0.2748095989227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,8,1,balanced,0.13889599839846292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,8,1,balanced,0.1434719959894816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,8,1,power_law_1.01,0.1502784013748169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,8,1,power_law_1.01,0.1512895941734314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,8,1,power_law_1.2,0.15023360252380372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,16384,2,8,8,1,power_law_1.2,0.15092480182647705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,1,balanced,3.0435412724812827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,1,balanced,3.1355679829915366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,1,power_law_1.01,2.5792640686035155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,1,power_law_1.01,2.5995199203491213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,1,power_law_1.2,2.5235904693603515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,1,power_law_1.2,2.538438415527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,128,balanced,0.16051200032234192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,128,balanced,0.16220266620318094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,128,power_law_1.01,0.15892479419708253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,128,power_law_1.01,0.15957759618759154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,128,power_law_1.2,0.1582527995109558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,128,power_law_1.2,0.15916160345077515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,16,balanced,0.32066667079925537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,16,balanced,0.321941335995992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,16,power_law_1.01,0.30186240673065184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,16,power_law_1.01,0.3070208072662354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,16,power_law_1.2,0.304915189743042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,16,power_law_1.2,0.31269121170043945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,2,balanced,1.5665705998738606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,2,balanced,1.5904906590779622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,2,power_law_1.01,1.3439167976379394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,2,power_law_1.01,1.3488320350646972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,2,power_law_1.2,1.362668800354004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,2,power_law_1.2,1.3758079528808593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,256,balanced,0.15914133191108704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,256,balanced,0.15972266594568887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,256,power_law_1.01,0.15471359491348266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,256,power_law_1.01,0.1550271987915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,256,power_law_1.2,0.15467519760131837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,256,power_law_1.2,0.1556607961654663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,32,balanced,0.2076746622721354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,32,balanced,0.20854399601618448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,32,power_law_1.01,0.19664000272750853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,32,power_law_1.01,0.19903359413146973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,32,power_law_1.2,0.19809279441833497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,32,power_law_1.2,0.2015552043914795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,4,balanced,0.8387946287790934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,4,balanced,0.8391199906667074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,4,power_law_1.01,0.7419968128204346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,4,power_law_1.01,0.7875584125518799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,4,power_law_1.2,0.7458111763000488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,4,power_law_1.2,0.7717055797576904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,64,balanced,0.16863999764124551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,64,balanced,0.17049066225687662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,64,power_law_1.01,0.16655999422073364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,64,power_law_1.01,0.1670912027359009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,64,power_law_1.2,0.16687999963760375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,64,power_law_1.2,0.16725759506225585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,8,balanced,0.49161601066589355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,8,balanced,0.4935306708017985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,8,power_law_1.01,0.4483583927154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,8,power_law_1.01,0.466809606552124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,8,power_law_1.2,0.4497856140136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,1,8,power_law_1.2,0.4748095989227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,16,1,balanced,0.323034663995107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,16,1,balanced,0.3243680000305176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,16,1,power_law_1.01,0.2603840112686157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,16,1,power_law_1.01,0.2761087894439697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,16,1,power_law_1.2,0.26056320667266847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,16,1,power_law_1.2,0.2873536109924316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,2,1,balanced,1.5451946258544922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,2,1,balanced,1.546170711517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,2,1,power_law_1.01,1.3150912284851075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,2,1,power_law_1.01,1.355673599243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,2,1,power_law_1.2,1.3304767608642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,2,1,power_law_1.2,1.3400896072387696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,32,1,balanced,0.22493332624435425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,32,1,balanced,0.22516266504923502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,32,1,power_law_1.01,0.20850560665130616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,32,1,power_law_1.01,0.2108288049697876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,32,1,power_law_1.2,0.21003520488739014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,32,1,power_law_1.2,0.21064960956573486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,4,1,balanced,0.800976037979126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,4,1,balanced,0.8014240264892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,4,1,power_law_1.01,0.6785920143127442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,4,1,power_law_1.01,0.7085375785827637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,4,1,power_law_1.2,0.6768576145172119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,4,1,power_law_1.2,0.6826560020446777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,8,1,balanced,0.4737226565678914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,8,1,balanced,0.47512535254160565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,8,1,power_law_1.01,0.39439361095428466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,8,1,power_law_1.01,0.4104000091552734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,8,1,power_law_1.2,0.4104447841644287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2048,8,256,8,1,power_law_1.2,0.41858558654785155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,1,balanced,2.3909494082132974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,1,balanced,2.427994728088379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,1,power_law_1.01,2.1567487716674805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,1,power_law_1.01,2.163552093505859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,1,power_law_1.2,2.2368383407592773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,1,power_law_1.2,2.276889610290527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,16,balanced,0.2505813241004944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,16,balanced,0.2529866695404053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,16,power_law_1.01,0.23008639812469484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,16,power_law_1.01,0.23995521068572997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,16,power_law_1.2,0.241759991645813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,16,power_law_1.2,0.25240321159362794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,2,balanced,1.2491412957509358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,2,balanced,1.2613866329193115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,2,power_law_1.01,1.1351296424865722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,2,power_law_1.01,1.168070411682129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,2,power_law_1.2,1.1419967651367187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,2,power_law_1.2,1.2080896377563477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,32,balanced,0.16236799955368042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,32,balanced,0.16260266304016113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,32,power_law_1.01,0.1555392026901245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,32,power_law_1.01,0.16016639471054078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,32,power_law_1.2,0.16060160398483275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,32,power_law_1.2,0.1634752035140991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,4,balanced,0.6612853209177653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,4,balanced,0.6649706761042277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,4,power_law_1.01,0.6298495769500733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,4,power_law_1.01,0.6394048213958741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,4,power_law_1.2,0.6267007827758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,4,power_law_1.2,0.6501503944396972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,8,balanced,0.3816479841868083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,8,balanced,0.3820426861445109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,8,power_law_1.01,0.3680959939956665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,8,power_law_1.01,0.37084159851074217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,8,power_law_1.2,0.3741055965423584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,1,8,power_law_1.2,0.37562239170074463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,16,1,balanced,0.26581867535909015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,16,1,balanced,0.2660213311513265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,16,1,power_law_1.01,0.2334144115447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,16,1,power_law_1.01,0.24232959747314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,16,1,power_law_1.2,0.2520576000213623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,16,1,power_law_1.2,0.2601855993270874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,2,1,balanced,1.2243093649546306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,2,1,balanced,1.226080020268758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,2,1,power_law_1.01,1.1004608154296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,2,1,power_law_1.01,1.1192383766174316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,2,1,power_law_1.2,1.1398591995239258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,2,1,power_law_1.2,1.140409564971924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,32,1,balanced,0.18614399433135986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,32,1,balanced,0.1864479978879293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,32,1,power_law_1.01,0.1768447995185852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,32,1,power_law_1.01,0.17868800163269044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,32,1,power_law_1.2,0.17844480276107788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,32,1,power_law_1.2,0.1796288013458252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,4,1,balanced,0.6377866665522257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,4,1,balanced,0.6387679974238077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,4,1,power_law_1.01,0.607206392288208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,4,1,power_law_1.01,0.6079808235168457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,4,1,power_law_1.2,0.617625617980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,4,1,power_law_1.2,0.6177728176116943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,8,1,balanced,0.358512004216512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,8,1,power_law_1.01,0.34177920818328855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,8,1,power_law_1.01,0.34311680793762206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,8,1,power_law_1.2,0.3442303895950317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,6144,2560,8,160,8,1,power_law_1.2,0.34621438980102537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,1,balanced,3.558346748352051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,1,balanced,3.563701311747233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,1,power_law_1.01,3.052038383483887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,1,power_law_1.01,3.059040069580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,1,power_law_1.2,2.9503488540649414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,1,power_law_1.2,3.026630401611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,128,balanced,0.18370133638381958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,128,balanced,0.18475733200709024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,128,power_law_1.01,0.18126720190048218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,128,power_law_1.01,0.1814463973045349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,128,power_law_1.2,0.17912960052490234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,128,power_law_1.2,0.18190720081329345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,16,balanced,0.38231468200683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,16,balanced,0.38436798254648846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,16,power_law_1.01,0.33422720432281494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,16,power_law_1.01,0.34593920707702636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,16,power_law_1.2,0.3601279973983765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,16,power_law_1.2,0.36253440380096436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,2,balanced,1.8898293177286785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,2,balanced,1.9062879880269368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,2,power_law_1.01,1.5314687728881835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,2,power_law_1.01,1.5666496276855468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,2,power_law_1.2,1.5828160285949706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,2,power_law_1.2,1.5894847869873048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,256,balanced,0.18068800369898477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,256,balanced,0.18198400735855103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,256,power_law_1.01,0.17804160118103027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,256,power_law_1.01,0.17827839851379396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,256,power_law_1.2,0.17782399654388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,256,power_law_1.2,0.1786687970161438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,32,balanced,0.24741866191228232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,32,balanced,0.24816532929738364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,32,power_law_1.01,0.23232638835906982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,32,power_law_1.01,0.23271679878234863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,32,power_law_1.2,0.23558399677276612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,32,power_law_1.2,0.23630080223083497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,4,balanced,0.9792746702829996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,4,balanced,0.9813066323598226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,4,power_law_1.01,0.8774335861206055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,4,power_law_1.01,0.8962752342224121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,4,power_law_1.2,0.8713791847229004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,4,power_law_1.2,0.8993344306945801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,64,balanced,0.19369600216547647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,64,balanced,0.194815993309021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,64,power_law_1.01,0.19088640213012695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,64,power_law_1.01,0.19134080410003662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,64,power_law_1.2,0.18891520500183107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,64,power_law_1.2,0.19182080030441284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,8,balanced,0.580623984336853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,8,balanced,0.5856639941533407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,8,power_law_1.01,0.5437503814697265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,8,power_law_1.01,0.5531519889831543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,8,power_law_1.2,0.5402431964874268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,1,8,power_law_1.2,0.5512896060943604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,16,1,balanced,0.37668800354003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,16,1,balanced,0.3784426848093669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,16,1,power_law_1.01,0.2989376068115234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,16,1,power_law_1.01,0.305516791343689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,16,1,power_law_1.2,0.321727991104126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,16,1,power_law_1.2,0.32364161014556886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,2,1,balanced,1.8093172709147136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,2,1,balanced,1.8756213188171387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,2,1,power_law_1.01,1.5255616188049317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,2,1,power_law_1.01,1.5326144218444824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,2,1,power_law_1.2,1.551743984222412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,2,1,power_law_1.2,1.5739328384399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,32,1,balanced,0.25838400920232135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,32,1,balanced,0.2589706579844157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,32,1,power_law_1.01,0.23965439796447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,32,1,power_law_1.01,0.2418368101119995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,32,1,power_law_1.2,0.24184319972991944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,32,1,power_law_1.2,0.24191360473632811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,4,1,balanced,0.9343679745992025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,4,1,balanced,0.9369440078735352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,4,1,power_law_1.01,0.7918399810791016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,4,1,power_law_1.01,0.8201663970947266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,4,1,power_law_1.2,0.8133567810058594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,4,1,power_law_1.2,0.8309696197509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,8,1,balanced,0.556170662244161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,8,1,balanced,0.5562933286031088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,8,1,power_law_1.01,0.47362561225891114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,8,1,power_law_1.01,0.48625922203063965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,8,1,power_law_1.2,0.47324161529541015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,256,8,1,power_law_1.2,0.5102528095245361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,1,balanced,5.4637495676676435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,1,balanced,5.491903940836589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,1,power_law_1.01,4.119161605834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,1,power_law_1.01,4.1573951721191404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,1,power_law_1.2,4.060588836669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,1,power_law_1.2,4.208729553222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,128,balanced,0.2339199980099996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,128,balanced,0.23407467206319174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,128,power_law_1.01,0.22994558811187743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,128,power_law_1.01,0.23033599853515624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,128,power_law_1.2,0.22807040214538574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,128,power_law_1.2,0.2316351890563965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,16,balanced,0.5106613238652548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,16,balanced,0.5130453507105509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,16,power_law_1.01,0.4523327827453613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,16,power_law_1.01,0.467468786239624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,16,power_law_1.2,0.45044479370117185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,16,power_law_1.2,0.4664000034332275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,2,balanced,2.6717281341552734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,2,balanced,2.76798407236735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,2,power_law_1.01,2.0948543548583984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,2,power_law_1.01,2.1537023544311524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,2,power_law_1.2,2.076326370239258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,2,power_law_1.2,2.2171648025512694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,32,balanced,0.3550560077031453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,32,balanced,0.3550773461659749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,32,power_law_1.01,0.33050239086151123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,32,power_law_1.01,0.33568639755249025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,32,power_law_1.2,0.3109760046005249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,32,power_law_1.2,0.316102409362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,4,balanced,1.4458773930867512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,4,balanced,1.4526559511820476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,4,power_law_1.01,1.1351615905761718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,4,power_law_1.01,1.2077759742736816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,4,power_law_1.2,1.110489559173584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,4,power_law_1.2,1.1618687629699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,64,balanced,0.25916266441345215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,64,balanced,0.25989866256713867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,64,power_law_1.01,0.24836480617523193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,64,power_law_1.01,0.2512063980102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,64,power_law_1.2,0.24675838947296141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,64,power_law_1.2,0.25153920650482176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,8,balanced,0.8221973578135172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,8,balanced,0.8295199871063232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,8,power_law_1.01,0.6906559944152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,8,power_law_1.01,0.7102272033691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,8,power_law_1.2,0.7028992176055908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,1,8,power_law_1.2,0.7627903938293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,16,1,balanced,0.4893813530604045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,16,1,balanced,0.49328001340230304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,16,1,power_law_1.01,0.43077759742736815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,16,1,power_law_1.01,0.43434882164001465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,16,1,power_law_1.2,0.42887039184570314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,16,1,power_law_1.2,0.42899198532104493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,2,1,balanced,2.7334025700887046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,2,1,balanced,2.7745866775512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,2,1,power_law_1.01,2.143654441833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,2,1,power_law_1.01,2.149247932434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,2,1,power_law_1.2,2.0897151947021486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,2,1,power_law_1.2,2.097977638244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,32,1,balanced,0.353274663289388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,32,1,balanced,0.3558719952901204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,32,1,power_law_1.01,0.31146879196166993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,32,1,power_law_1.01,0.313702392578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,32,1,power_law_1.2,0.31008639335632326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,32,1,power_law_1.2,0.31127679347991943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,4,1,balanced,1.3707626660664876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,4,1,balanced,1.3808693885803223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,4,1,power_law_1.01,1.0988991737365723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,4,1,power_law_1.01,1.1116543769836427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,4,1,power_law_1.2,1.1014975547790526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,4,1,power_law_1.2,1.1070528030395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,8,1,balanced,0.7833706537882487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,8,1,balanced,0.7868533134460449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,8,1,power_law_1.01,0.6317759990692139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,8,1,power_law_1.01,0.6321407794952393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,8,1,power_law_1.2,0.6302656173706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,192,7168,2048,8,384,8,1,power_law_1.2,0.635539197921753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,1,balanced,0.04140799989302953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,1,balanced,0.04179200033346812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,1,power_law_1.01,0.03986560106277466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,1,power_law_1.01,0.04203520119190216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,1,power_law_1.2,0.04056960046291351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,1,power_law_1.2,0.04163840115070343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,128,balanced,0.027034667630990345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,128,balanced,0.029285334050655365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,128,power_law_1.01,0.02588160037994385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,128,power_law_1.01,0.027193599939346315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,128,power_law_1.2,0.026598399877548216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,128,power_law_1.2,0.027263998985290527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,16,balanced,0.02917333443959554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,16,balanced,0.029285334050655365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,16,power_law_1.01,0.03294720053672791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,16,power_law_1.01,0.03345920145511627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,16,power_law_1.2,0.03330560028553009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,16,power_law_1.2,0.03384959995746613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,2,balanced,0.03526933242877325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,2,balanced,0.046053335070610046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,2,power_law_1.01,0.04350079894065857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,2,power_law_1.01,0.0455487996339798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,2,power_law_1.2,0.040908798575401306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,2,power_law_1.2,0.042105600237846375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,32,balanced,0.02784000088771184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,32,balanced,0.029194665451844532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,32,power_law_1.01,0.027968001365661622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,32,power_law_1.01,0.02903040051460266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,32,power_law_1.2,0.028064000606536865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,32,power_law_1.2,0.028857600688934327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,4,balanced,0.029631999631722767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,4,balanced,0.03181866556406021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,4,power_law_1.01,0.04255360066890716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,4,power_law_1.01,0.04266240000724793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,4,power_law_1.2,0.037510401010513304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,4,power_law_1.2,0.038406398892402646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,64,balanced,0.02918400118748347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,64,balanced,0.029264000554879505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,64,power_law_1.01,0.026655998826026917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,64,power_law_1.01,0.027136000990867614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,64,power_law_1.2,0.02645759880542755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,64,power_law_1.2,0.0274944007396698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,8,balanced,0.02733866622050603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,8,balanced,0.027429332335789997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,8,power_law_1.01,0.036857599020004274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,8,power_law_1.01,0.04106239974498749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,8,power_law_1.2,0.03454079926013946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,1,8,power_law_1.2,0.03548159897327423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,2,1,balanced,0.03130666663249334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,2,1,balanced,0.03148266673088074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,2,1,power_law_1.01,0.030329599976539612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,2,1,power_law_1.01,0.03201279938220978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,2,1,power_law_1.2,0.030527999997138976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,2,1,power_law_1.2,0.030700799822807313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,4,1,balanced,0.027274665733178455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,4,1,balanced,0.027402666707833607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,4,1,power_law_1.01,0.026745599508285523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,4,1,power_law_1.01,0.02736000120639801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,4,1,power_law_1.2,0.026169601082801818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2048,768,8,128,4,1,power_law_1.2,0.02675839960575104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,1,balanced,0.0740533322095871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,1,balanced,0.07436266541481018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,1,power_law_1.01,0.07326719760894776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,1,power_law_1.01,0.07333120107650756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,1,power_law_1.2,0.07227519750595093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,1,power_law_1.2,0.07319039702415467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,128,balanced,0.03346666693687439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,128,balanced,0.03374933451414108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,128,power_law_1.01,0.031167998909950256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,128,power_law_1.01,0.031999999284744264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,128,power_law_1.2,0.031673601269721983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,128,power_law_1.2,0.032416000962257385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,16,balanced,0.03333866596221924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,16,balanced,0.033439998825391136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,16,power_law_1.01,0.06723200082778931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,16,power_law_1.01,0.06796799898147583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,16,power_law_1.2,0.05348479747772217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,16,power_law_1.2,0.05661439895629883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,2,balanced,0.056458666920661926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,2,balanced,0.0580213318268458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,2,power_law_1.01,0.08650879859924317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,2,power_law_1.01,0.08734719753265381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,2,power_law_1.2,0.0779263973236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,2,power_law_1.2,0.07902079820632935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,32,balanced,0.03350933392842611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,32,balanced,0.033573334415753685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,32,power_law_1.01,0.04547840058803558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,32,power_law_1.01,0.045484799146652224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,32,power_law_1.2,0.04542079865932465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,32,power_law_1.2,0.046348801255226134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,4,balanced,0.041152000427246094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,4,balanced,0.04153066625197729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,4,power_law_1.01,0.08097919821739197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,4,power_law_1.01,0.08498560190200806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,4,power_law_1.2,0.06099839806556702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,4,power_law_1.2,0.06312320232391358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,64,balanced,0.033370666205883026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,64,balanced,0.03339733431736628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,64,power_law_1.01,0.03477759957313538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,64,power_law_1.01,0.03516800105571747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,64,power_law_1.2,0.03550080060958862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,64,power_law_1.2,0.03603839874267578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,8,balanced,0.037690666814645134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,8,balanced,0.03788266579310099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,8,power_law_1.01,0.08216320276260376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,8,power_law_1.01,0.08478080034255982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,8,power_law_1.2,0.06588159799575806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,1,8,power_law_1.2,0.07225599884986877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,16,1,balanced,0.03733866661787033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,16,1,balanced,0.03770666569471359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,16,1,power_law_1.01,0.03603839874267578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,16,1,power_law_1.01,0.03620480000972748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,16,1,power_law_1.2,0.037036800384521486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,16,1,power_law_1.2,0.03770880103111267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,2,1,balanced,0.05309866865475973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,2,1,balanced,0.05402666827042898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,2,1,power_law_1.01,0.051641601324081424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,2,1,power_law_1.01,0.05172479748725891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,2,1,power_law_1.2,0.051718401908874514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,2,1,power_law_1.2,0.05182719826698303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,32,1,balanced,0.03798400113979975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,32,1,balanced,0.03818133225043615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,32,1,power_law_1.01,0.036134400963783266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,32,1,power_law_1.01,0.036160001158714296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,32,1,power_law_1.2,0.03552640080451965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,32,1,power_law_1.2,0.03624959886074066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,4,1,balanced,0.0354720006386439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,4,1,balanced,0.03740799923737844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,4,1,power_law_1.01,0.035104000568389894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,4,1,power_law_1.01,0.03527039885520935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,4,1,power_law_1.2,0.03529599905014038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,4,1,power_law_1.2,0.038815999031066896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,8,1,balanced,0.04174399872620901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,8,1,balanced,0.04320533573627472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,8,1,power_law_1.01,0.040863999724388124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,8,1,power_law_1.01,0.0419840008020401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,8,1,power_law_1.2,0.045151999592781066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,2688,1856,6,128,8,1,power_law_1.2,0.045414400100708005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,1,balanced,0.094842662413915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,1,balanced,0.09675733248392741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,1,power_law_1.01,0.09112319946289063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,1,power_law_1.01,0.09128959774971009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,1,power_law_1.2,0.09525759816169739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,1,power_law_1.2,0.10103679895401001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,128,balanced,0.03159466634194056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,128,balanced,0.03310933212439219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,128,power_law_1.01,0.031795200705528257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,128,power_law_1.01,0.03180800080299377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,128,power_law_1.2,0.03198719918727875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,128,power_law_1.2,0.03221760094165802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,16,balanced,0.0334346666932106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,16,balanced,0.03359466542800268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,16,power_law_1.01,0.09518719911575317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,16,power_law_1.01,0.09524480104446412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,16,power_law_1.2,0.0929472029209137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,16,power_law_1.2,0.09523199796676636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,2,balanced,0.0622026671965917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,2,balanced,0.06226666768391927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,2,power_law_1.01,0.09666560292243957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,2,power_law_1.01,0.09749119877815246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,2,power_law_1.2,0.09540479779243469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,2,power_law_1.2,0.09556480050086975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,256,balanced,0.03188266605138779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,256,balanced,0.0331839993596077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,256,power_law_1.01,0.03113600015640259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,256,power_law_1.01,0.03126400113105774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,256,power_law_1.2,0.031302401423454286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,256,power_law_1.2,0.031481599807739256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,32,balanced,0.031850665807724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,32,balanced,0.03322133421897888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,32,power_law_1.01,0.0596671998500824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,32,power_law_1.01,0.06056960225105286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,32,power_law_1.2,0.05937280058860779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,32,power_law_1.2,0.059622400999069215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,4,balanced,0.04952533543109894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,4,balanced,0.051738664507865906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,4,power_law_1.01,0.09520639777183533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,4,power_law_1.01,0.09541760087013244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,4,power_law_1.2,0.09371520280838012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,4,power_law_1.2,0.09507840275764465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,64,balanced,0.0331839993596077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,64,balanced,0.033488000432650246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,64,power_law_1.01,0.04482559859752655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,64,power_law_1.01,0.04573439955711365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,64,power_law_1.2,0.04565120041370392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,64,power_law_1.2,0.04609279930591583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,8,balanced,0.033557333052158356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,8,balanced,0.03554133325815201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,8,power_law_1.01,0.09579520225524903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,8,power_law_1.01,0.09649919867515563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,8,power_law_1.2,0.09356160163879394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,1,8,power_law_1.2,0.0945792019367218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,16,1,balanced,0.027386667827765148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,16,1,balanced,0.02752533306678136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,16,1,power_law_1.01,0.02625280022621155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,16,1,power_law_1.01,0.02630400061607361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,16,1,power_law_1.2,0.02622720003128052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,16,1,power_law_1.2,0.02625280022621155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,2,1,balanced,0.05615466833114624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,2,1,balanced,0.05778133372465769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,2,1,power_law_1.01,0.05430399775505066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,2,1,power_law_1.01,0.05493760108947754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,2,1,power_law_1.2,0.05477759838104248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,2,1,power_law_1.2,0.05532159805297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,32,1,balanced,0.0271519993742307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,32,1,balanced,0.02752533306678136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,32,1,power_law_1.01,0.025856000185012818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,32,1,power_law_1.01,0.02600319981575012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,32,1,power_law_1.2,0.02568959891796112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,32,1,power_law_1.2,0.026067200303077697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,4,1,balanced,0.03764266769091288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,4,1,balanced,0.038933334251244865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,4,1,power_law_1.01,0.039366400241851805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,4,1,power_law_1.01,0.039705601334571836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,4,1,power_law_1.2,0.03893760144710541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,4,1,power_law_1.2,0.039980798959732056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,8,1,balanced,0.029546665648619335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,8,1,balanced,0.031328000128269196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,8,1,power_law_1.01,0.02800000011920929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,8,1,power_law_1.01,0.028255999088287354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,8,1,power_law_1.2,0.02807680070400238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,3072,1536,8,256,8,1,power_law_1.2,0.028217598795890808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,1,balanced,0.23762667179107666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,1,balanced,0.23811199267705283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,1,power_law_1.01,0.19011199474334717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,1,power_law_1.01,0.2161792039871216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,1,power_law_1.2,0.20166399478912353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,1,power_law_1.2,0.2027199983596802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,2,balanced,0.14751467108726501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,2,balanced,0.15059199929237366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,2,power_law_1.01,0.14763519763946534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,2,power_law_1.01,0.17082879543304444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,2,power_law_1.2,0.13918720483779906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,2,power_law_1.2,0.16328959465026854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,4,balanced,0.11750933527946472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,4,balanced,0.12297067046165466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,4,power_law_1.01,0.13105920553207398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,4,power_law_1.01,0.14082560539245606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,4,power_law_1.2,0.12488960027694702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,4,power_law_1.2,0.13306879997253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,8,balanced,0.11085333426793416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,8,balanced,0.1150933305422465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,8,power_law_1.01,0.10940159559249878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,8,power_law_1.01,0.1102463960647583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,8,power_law_1.2,0.10844800472259522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,1,8,power_law_1.2,0.11038719415664673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,16,1,balanced,0.03369066615899404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,16,1,balanced,0.035530666510264076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,16,1,power_law_1.01,0.03446399867534637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,16,1,power_law_1.01,0.035078400373458864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,16,1,power_law_1.2,0.03413119912147522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,16,1,power_law_1.2,0.0342848002910614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,2,1,balanced,0.13550933202107748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,2,1,balanced,0.13760000467300415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,2,1,power_law_1.01,0.11354240179061889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,2,1,power_law_1.01,0.12446719408035278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,2,1,power_law_1.2,0.11274880170822144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,2,1,power_law_1.2,0.13181439638137818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,32,1,balanced,0.02916266769170761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,32,1,balanced,0.031290667752424874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,32,1,power_law_1.01,0.028896000981330872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,32,1,power_law_1.01,0.030169600248336793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,32,1,power_law_1.2,0.029529601335525513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,32,1,power_law_1.2,0.029625600576400755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,4,1,balanced,0.08473599950472514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,4,1,balanced,0.09521067142486572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,4,1,power_law_1.01,0.0676479995250702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,4,1,power_law_1.01,0.07134079933166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,4,1,power_law_1.2,0.07514879703521729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,4,1,power_law_1.2,0.07533439993858337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,8,1,balanced,0.05705599983533224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,8,1,balanced,0.06015466650327047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,8,1,power_law_1.01,0.04599039852619171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,8,1,power_law_1.01,0.046777600049972536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,8,1,power_law_1.2,0.04618239998817444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,14336,2,8,8,1,power_law_1.2,0.049344000220298764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,1,balanced,0.12199466427167256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,1,balanced,0.12275200088818868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,1,power_law_1.01,0.11660799980163575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,1,power_law_1.01,0.1170240044593811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,1,power_law_1.2,0.11679359674453735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,1,power_law_1.2,0.11692160367965698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,128,balanced,0.03554133325815201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,128,balanced,0.03571200122435888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,128,power_law_1.01,0.033670398592948916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,128,power_law_1.01,0.03375360071659088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,128,power_law_1.2,0.034329599142074584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,128,power_law_1.2,0.03443840146064758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,16,balanced,0.035205334424972534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,16,balanced,0.03532266616821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,16,power_law_1.01,0.0711296021938324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,16,power_law_1.01,0.0750976026058197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,16,power_law_1.2,0.06885120272636414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,16,power_law_1.2,0.07235199809074402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,2,balanced,0.0788266658782959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,2,balanced,0.08080000181992848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,2,power_law_1.01,0.10565760135650634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,2,power_law_1.01,0.1126207947731018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,2,power_law_1.2,0.10224000215530396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,2,power_law_1.2,0.10484479665756226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,32,balanced,0.0353973334034284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,32,balanced,0.035589332381884255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,32,power_law_1.01,0.052774399518966675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,32,power_law_1.01,0.053414398431777955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,32,power_law_1.2,0.051974397897720334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,32,power_law_1.2,0.05226879715919495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,4,balanced,0.055344000458717346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,4,balanced,0.056090667843818665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,4,power_law_1.01,0.09854080080986023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,4,power_law_1.01,0.09873920083045959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,4,power_law_1.2,0.0832319974899292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,4,power_law_1.2,0.0973695993423462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,64,balanced,0.0355679988861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,64,balanced,0.03569599986076355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,64,power_law_1.01,0.03687039911746979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,64,power_law_1.01,0.037248000502586365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,64,power_law_1.2,0.03678719997406006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,64,power_law_1.2,0.037747201323509214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,8,balanced,0.03782933453718821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,8,balanced,0.03869866579771042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,8,power_law_1.01,0.09717760086059571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,8,power_law_1.01,0.10195200443267823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,8,power_law_1.2,0.07541760206222534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,1,8,power_law_1.2,0.08008959889411926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,16,1,balanced,0.033530667424201965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,16,1,balanced,0.03456533451875051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,16,1,power_law_1.01,0.03457919955253601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,16,1,power_law_1.01,0.034643200039863584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,16,1,power_law_1.2,0.03407360017299652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,16,1,power_law_1.2,0.03445119857788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,2,1,balanced,0.07463466624418895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,2,1,balanced,0.07481066882610321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,2,1,power_law_1.01,0.06839039921760559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,2,1,power_law_1.01,0.0709824025630951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,2,1,power_law_1.2,0.07052800059318542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,2,1,power_law_1.2,0.07121919989585876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,32,1,balanced,0.03329599897066752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,32,1,balanced,0.033674667278925575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,32,1,power_law_1.01,0.03187839984893799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,32,1,power_law_1.01,0.03238399922847748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,32,1,power_law_1.2,0.03172479867935181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,32,1,power_law_1.2,0.0326335996389389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,4,1,balanced,0.04822400212287903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,4,1,balanced,0.04996799925963084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,4,1,power_law_1.01,0.04689280092716217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,4,1,power_law_1.01,0.04716159999370575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,4,1,power_law_1.2,0.04759039878845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,4,1,power_law_1.2,0.04821760058403015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,8,1,balanced,0.03772799919048945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,8,1,balanced,0.038719999293486275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,8,1,power_law_1.01,0.037676799297332766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,8,1,power_law_1.01,0.03827199935913086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,8,1,power_law_1.2,0.03797760009765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,1536,8,128,8,1,power_law_1.2,0.038073599338531494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,1,balanced,0.44869331518809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,1,balanced,0.44954665501912433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,1,power_law_1.01,0.44712319374084475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,1,power_law_1.01,0.44929280281066897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,1,power_law_1.2,0.4462399959564209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,1,power_law_1.2,0.45000319480895995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,128,balanced,0.04021333406368891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,128,balanced,0.041696002086003624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,128,power_law_1.01,0.07171199917793274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,128,power_law_1.01,0.07337599992752075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,128,power_law_1.2,0.07137280106544494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,128,power_law_1.2,0.07156479954719544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,16,balanced,0.07331733405590057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,16,balanced,0.07435200115044911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,16,power_law_1.01,0.3371072053909302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,16,power_law_1.01,0.34076800346374514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,16,power_law_1.2,0.31676158905029295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,16,power_law_1.2,0.32335360050201417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,2,balanced,0.2632853388786316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,2,balanced,0.26657066742579144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,2,power_law_1.01,0.4524864196777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,2,power_law_1.01,0.4547264099121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,2,power_law_1.2,0.3931328058242798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,2,power_law_1.2,0.40198397636413574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,256,balanced,0.04142399877309799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,256,balanced,0.04173333446184794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,256,power_law_1.01,0.054124802350997925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,256,power_law_1.01,0.055308800935745236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,256,power_law_1.2,0.055206400156021115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,256,power_law_1.2,0.055340802669525145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,32,balanced,0.06214933097362518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,32,balanced,0.06518400212128957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,32,power_law_1.01,0.1967039942741394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,32,power_law_1.01,0.19763200283050536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,32,power_law_1.2,0.19633280038833617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,32,power_law_1.2,0.19912960529327392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,4,balanced,0.15842666228612265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,4,balanced,0.16076800227165222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,4,power_law_1.01,0.4447296142578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,4,power_law_1.01,0.45369601249694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,4,power_law_1.2,0.3395071983337402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,4,power_law_1.2,0.3891455888748169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,64,balanced,0.05745600163936615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,64,balanced,0.059392000238100685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,64,power_law_1.01,0.11923199892044067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,64,power_law_1.01,0.11931519508361817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,64,power_law_1.2,0.11875840425491332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,64,power_law_1.2,0.12151679992675782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,8,balanced,0.1132480005423228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,8,balanced,0.11424533526102702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,8,power_law_1.01,0.444320011138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,8,power_law_1.01,0.45169920921325685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,8,power_law_1.2,0.304256010055542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,1,8,power_law_1.2,0.3206016063690186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,16,1,balanced,0.13157332936922708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,16,1,balanced,0.1323253313700358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,16,1,power_law_1.01,0.13038079738616942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,16,1,power_law_1.01,0.13201279640197755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,16,1,power_law_1.2,0.12975360155105592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,16,1,power_law_1.2,0.1313920021057129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,2,1,balanced,0.24316799640655518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,2,1,balanced,0.24452267090479532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,2,1,power_law_1.01,0.24145278930664063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,2,1,power_law_1.01,0.24449920654296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,2,1,power_law_1.2,0.2415424108505249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,2,1,power_law_1.2,0.24494080543518065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,32,1,balanced,0.101583997408549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,32,1,balanced,0.10222933689753215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,32,1,power_law_1.01,0.09390079975128174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,32,1,power_law_1.01,0.0964352011680603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,32,1,power_law_1.2,0.10039680004119873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,32,1,power_law_1.2,0.10087679624557495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,4,1,balanced,0.15064533551534018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,4,1,balanced,0.15179199973742166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,4,1,power_law_1.01,0.1463487982749939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,4,1,power_law_1.01,0.1475775957107544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,4,1,power_law_1.2,0.14911999702453613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,4,1,power_law_1.2,0.15088640451431273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,8,1,balanced,0.09867200255393982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,8,1,balanced,0.09977066516876221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,8,1,power_law_1.01,0.09638400077819824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,8,1,power_law_1.01,0.09953920245170593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,8,1,power_law_1.2,0.09741439819335937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,4096,2688,22,512,8,1,power_law_1.2,0.09883520007133484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,1,balanced,0.36979198455810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,1,balanced,0.38839999834696454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,1,power_law_1.01,0.33644158840179444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,1,power_law_1.01,0.36099839210510254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,1,power_law_1.2,0.2978559970855713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,1,power_law_1.2,0.3332672119140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,2,balanced,0.22551467021306357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,2,balanced,0.26681600014368695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,2,power_law_1.01,0.22393600940704345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,2,power_law_1.01,0.25418241024017335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,2,power_law_1.2,0.2607295989990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,2,power_law_1.2,0.29109759330749513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,4,balanced,0.15191466609636942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,4,balanced,0.1547040045261383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,4,power_law_1.01,0.17800320386886598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,4,power_law_1.01,0.19459199905395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,4,power_law_1.2,0.16599040031433104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,4,power_law_1.2,0.187391996383667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,8,balanced,0.15084266662597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,8,balanced,0.1535253326098124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,8,power_law_1.01,0.14728959798812866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,8,power_law_1.01,0.14959360361099244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,8,power_law_1.2,0.1497215986251831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,1,8,power_law_1.2,0.1522752046585083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,16,1,balanced,0.04786133269468943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,16,1,balanced,0.04844800134499868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,16,1,power_law_1.01,0.04445439875125885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,16,1,power_law_1.01,0.04521600008010864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,16,1,power_law_1.2,0.045561599731445315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,16,1,power_law_1.2,0.046316799521446225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,2,1,balanced,0.2129546602567037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,2,1,balanced,0.2378773291905721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,2,1,power_law_1.01,0.1785215973854065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,2,1,power_law_1.01,0.18891520500183107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,2,1,power_law_1.2,0.17070080041885377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,2,1,power_law_1.2,0.19491200447082518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,32,1,balanced,0.039408000806967415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,32,1,balanced,0.03946666667858759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,32,1,power_law_1.01,0.03868800103664398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,32,1,power_law_1.01,0.039238399267196654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,32,1,power_law_1.2,0.03950720131397247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,32,1,power_law_1.2,0.04035199880599975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,4,1,balanced,0.12443733215332031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,4,1,balanced,0.1399999956289927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,4,1,power_law_1.01,0.09907199740409851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,4,1,power_law_1.01,0.1068160057067871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,4,1,power_law_1.2,0.11264640092849731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,4,1,power_law_1.2,0.11665920019149781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,8,1,balanced,0.07000533243020375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,8,1,balanced,0.07493866483370464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,8,1,power_law_1.01,0.05958399772644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,8,1,power_law_1.01,0.06289280056953431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,8,1,power_law_1.2,0.06550400257110596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,16384,2,8,8,1,power_law_1.2,0.06869120001792908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,1,balanced,0.2106399933497111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,1,balanced,0.24833067258199057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,1,power_law_1.01,0.20904319286346434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,1,power_law_1.01,0.21004800796508788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,1,power_law_1.2,0.20908799171447753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,1,power_law_1.2,0.2095871925354004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,128,balanced,0.043194666504859924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,128,balanced,0.043509334325790405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,128,power_law_1.01,0.05857920050621033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,128,power_law_1.01,0.05864319801330566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,128,power_law_1.2,0.05804160237312317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,128,power_law_1.2,0.05813760161399841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,16,balanced,0.0417546679576238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,16,balanced,0.04359466830889384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,16,power_law_1.01,0.2162623882293701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,16,power_law_1.01,0.21697919368743895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,16,power_law_1.2,0.20758399963378907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,16,power_law_1.2,0.2162303924560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,2,balanced,0.1340000033378601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,2,balanced,0.13698666294415793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,2,power_law_1.01,0.21587839126586914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,2,power_law_1.01,0.21667840480804443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,2,power_law_1.2,0.2126528024673462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,2,power_law_1.2,0.21722240447998048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,256,balanced,0.0421066681543986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,256,balanced,0.04374399781227112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,256,power_law_1.01,0.04079999923706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,256,power_law_1.01,0.04097920060157776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,256,power_law_1.2,0.04049279987812042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,256,power_law_1.2,0.0406464010477066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,32,balanced,0.042650664846102394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,32,balanced,0.04377066592375437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,32,power_law_1.01,0.1307263970375061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,32,power_law_1.01,0.13430399894714357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,32,power_law_1.2,0.13024640083312988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,32,power_law_1.2,0.13185919523239137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,4,balanced,0.07493866483370464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,4,balanced,0.07648000121116638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,4,power_law_1.01,0.21738879680633544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,4,power_law_1.01,0.2219327926635742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,4,power_law_1.2,0.21541121006011962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,4,power_law_1.2,0.216646409034729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,64,balanced,0.04377066592375437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,64,balanced,0.04381866753101349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,64,power_law_1.01,0.07381119728088378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,64,power_law_1.01,0.07442560195922851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,64,power_law_1.2,0.07423999905586243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,64,power_law_1.2,0.0753216028213501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,8,balanced,0.06010666489601135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,8,balanced,0.06019733349482218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,8,power_law_1.01,0.21546878814697265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,8,power_law_1.01,0.21666560173034669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,8,power_law_1.2,0.20378880500793456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,1,8,power_law_1.2,0.21646718978881835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,16,1,balanced,0.04357333481311798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,16,1,balanced,0.0462719996770223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,16,1,power_law_1.01,0.040140798687934874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,16,1,power_law_1.01,0.04039680063724518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,16,1,power_law_1.2,0.040524798631668094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,16,1,power_law_1.2,0.04392960071563721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,2,1,balanced,0.13149333000183105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,2,1,balanced,0.13176533579826355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,2,1,power_law_1.01,0.13004159927368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,2,1,power_law_1.01,0.13441920280456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,2,1,power_law_1.2,0.12661759853363036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,2,1,power_law_1.2,0.1307136058807373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,32,1,balanced,0.04051200052102407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,32,1,balanced,0.04148799926042557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,32,1,power_law_1.01,0.03963519930839539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,32,1,power_law_1.01,0.03976320028305054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,32,1,power_law_1.2,0.03928320109844208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,32,1,power_law_1.2,0.03997440040111542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,4,1,balanced,0.07253333429495494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,4,1,balanced,0.07338666419188182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,4,1,power_law_1.01,0.0711679995059967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,4,1,power_law_1.01,0.07825919985771179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,4,1,power_law_1.2,0.07155200242996215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,4,1,power_law_1.2,0.07207679748535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,8,1,balanced,0.051967998345692955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,8,1,balanced,0.052383999029795326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,8,1,power_law_1.01,0.050432002544403075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,8,1,power_law_1.01,0.052339202165603636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,8,1,power_law_1.2,0.050400000810623166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2048,8,256,8,1,power_law_1.2,0.05070719718933105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,1,balanced,0.24080532789230347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,1,balanced,0.24226667483647665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,1,power_law_1.01,0.23911681175231933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,1,power_law_1.01,0.24085760116577148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,1,power_law_1.2,0.24031360149383546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,1,power_law_1.2,0.24821119308471679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,16,balanced,0.045994664231936135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,16,balanced,0.04778666794300079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,16,power_law_1.01,0.17045120000839234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,16,power_law_1.01,0.17216639518737792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,16,power_law_1.2,0.15936000347137452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,16,power_law_1.2,0.1627392053604126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,2,balanced,0.14662399888038635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,2,balanced,0.14816000064214072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,2,power_law_1.01,0.22621440887451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,2,power_law_1.01,0.23299839496612548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,2,power_law_1.2,0.2017728090286255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,2,power_law_1.2,0.20882558822631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,32,balanced,0.04781866570313772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,32,balanced,0.04926399886608124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,32,power_law_1.01,0.10316159725189208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,32,power_law_1.01,0.10444799661636353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,32,power_law_1.2,0.10231679677963257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,32,power_law_1.2,0.10301439762115479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,4,balanced,0.0844640036424001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,4,balanced,0.0851093331972758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,4,power_law_1.01,0.22926080226898193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,4,power_law_1.01,0.2412287950515747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,4,power_law_1.2,0.17859840393066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,4,power_law_1.2,0.19001599550247192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,8,balanced,0.06195733447869619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,8,balanced,0.06389866769313812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,8,power_law_1.01,0.21042559146881104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,8,power_law_1.01,0.2198784112930298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,8,power_law_1.2,0.15688960552215575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,1,8,power_law_1.2,0.18439040184020997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,16,1,balanced,0.049413333336512245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,16,1,balanced,0.04987733562787374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,16,1,power_law_1.01,0.04767360091209412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,16,1,power_law_1.01,0.048198398947715757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,16,1,power_law_1.2,0.04787839949131012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,2,1,balanced,0.14273599783579508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,2,1,balanced,0.14392000436782837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,2,1,power_law_1.01,0.14110080003738404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,2,1,power_law_1.01,0.1419584035873413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,2,1,power_law_1.2,0.14477440118789672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,2,1,power_law_1.2,0.14538880586624145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,32,1,balanced,0.041706666350364685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,32,1,balanced,0.04188266893227895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,32,1,power_law_1.01,0.04022400081157684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,32,1,power_law_1.01,0.04170239865779877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,32,1,power_law_1.2,0.04217599928379059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,32,1,power_law_1.2,0.043647998571395875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,4,1,balanced,0.0860693355401357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,4,1,balanced,0.0918239951133728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,4,1,power_law_1.01,0.08115199804306031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,4,1,power_law_1.01,0.08287360072135926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,4,1,power_law_1.2,0.08019199967384338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,4,1,power_law_1.2,0.08196480274200439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,8,1,balanced,0.05899199843406677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,8,1,balanced,0.06003733476003011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,8,1,power_law_1.01,0.058336001634597776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,8,1,power_law_1.01,0.05886080265045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,8,1,power_law_1.2,0.058387202024459836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,6144,2560,8,160,8,1,power_law_1.2,0.06166399717330932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,1,balanced,0.24012800057729086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,1,balanced,0.24122132857640585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,1,power_law_1.01,0.23905279636383056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,1,power_law_1.01,0.23967359066009522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,1,power_law_1.2,0.23845760822296141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,1,power_law_1.2,0.23921279907226561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,128,balanced,0.049653331438700356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,128,balanced,0.04965866605440775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,128,power_law_1.01,0.06343680024147033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,128,power_law_1.01,0.0637440025806427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,128,power_law_1.2,0.06272000074386597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,128,power_law_1.2,0.06309760212898255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,16,balanced,0.05020800232887268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,16,balanced,0.05167999863624573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,16,power_law_1.01,0.24684159755706786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,16,power_law_1.01,0.24749441146850587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,16,power_law_1.2,0.2319103956222534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,16,power_law_1.2,0.23576960563659669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,2,balanced,0.1554080049196879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,2,balanced,0.15690666437149048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,2,power_law_1.01,0.2444159984588623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,2,power_law_1.01,0.24471039772033693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,2,power_law_1.2,0.23678719997406006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,2,power_law_1.2,0.24567680358886718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,256,balanced,0.049029335379600525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,256,balanced,0.04977599779764811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,256,power_law_1.01,0.04832639992237091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,256,power_law_1.01,0.048563200235366824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,256,power_law_1.2,0.0483711987733841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,256,power_law_1.2,0.05067520141601563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,32,balanced,0.05009066561857859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,32,balanced,0.051685333251953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,32,power_law_1.01,0.15186560153961182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,32,power_law_1.2,0.15413119792938232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,32,power_law_1.2,0.15492479801177977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,4,balanced,0.08970666925112407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,4,balanced,0.0906880001227061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,4,power_law_1.01,0.24712319374084474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,4,power_law_1.01,0.24817280769348143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,4,power_law_1.2,0.23793280124664307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,4,power_law_1.2,0.24975359439849854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,64,balanced,0.04974933465321859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,64,balanced,0.05002133548259735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,64,power_law_1.01,0.08630399703979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,64,power_law_1.01,0.08940799832344055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,64,power_law_1.2,0.08621439933776856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,64,power_law_1.2,0.08625280261039733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,8,balanced,0.06595199803511302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,8,balanced,0.07706666489442189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,8,power_law_1.01,0.24445440769195556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,8,power_law_1.01,0.24651520252227782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,8,power_law_1.2,0.2457792043685913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,1,8,power_law_1.2,0.24638080596923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,16,1,balanced,0.0498879998922348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,16,1,balanced,0.05106133222579956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,16,1,power_law_1.01,0.045465600490570066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,16,1,power_law_1.01,0.04789760112762451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,16,1,power_law_1.2,0.04775680005550385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,16,1,power_law_1.2,0.048518401384353635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,2,1,balanced,0.14717866977055868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,2,1,balanced,0.15705600380897522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,2,1,power_law_1.01,0.15590399503707886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,2,1,power_law_1.01,0.18364800214767457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,2,1,power_law_1.2,0.14236799478530884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,2,1,power_law_1.2,0.14956159591674806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,32,1,balanced,0.04589866598447164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,32,1,balanced,0.04595200220743815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,32,1,power_law_1.01,0.04418559968471527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,32,1,power_law_1.01,0.04440320134162903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,32,1,power_law_1.2,0.044268798828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,32,1,power_law_1.2,0.04454399943351746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,4,1,balanced,0.08098666866620381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,4,1,balanced,0.08776000142097473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,4,1,power_law_1.01,0.07870720028877258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,4,1,power_law_1.01,0.08004480004310607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,4,1,power_law_1.2,0.07917439937591553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,4,1,power_law_1.2,0.07953919768333435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,8,1,balanced,0.05801600217819214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,8,1,balanced,0.058117335041364036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,8,1,power_law_1.01,0.059001600742340087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,8,1,power_law_1.01,0.06331520080566407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,8,1,power_law_1.2,0.0561024010181427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,256,8,1,power_law_1.2,0.05617920160293579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,1,balanced,0.2419360081354777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,1,balanced,0.2426933248837789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,1,power_law_1.01,0.23804159164428712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,1,power_law_1.01,0.23815679550170898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,1,power_law_1.2,0.23816959857940673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,1,power_law_1.2,0.24079999923706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,128,balanced,0.04970133304595947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,128,balanced,0.05000533163547516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,128,power_law_1.01,0.06944640278816223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,128,power_law_1.01,0.06948480010032654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,128,power_law_1.2,0.06963199973106385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,128,power_law_1.2,0.0706816017627716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,16,balanced,0.050000001986821495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,16,balanced,0.05003199974695841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,16,power_law_1.01,0.24700798988342285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,16,power_law_1.01,0.24917759895324706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,16,power_law_1.2,0.24627199172973632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,16,power_law_1.2,0.24744319915771484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,2,balanced,0.15281599760055542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,2,balanced,0.17822933197021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,2,power_law_1.01,0.24728960990905763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,2,power_law_1.01,0.24987521171569824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,2,power_law_1.2,0.2479935884475708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,2,power_law_1.2,0.25543038845062255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,32,balanced,0.0499893327554067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,32,balanced,0.05008000135421753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,32,power_law_1.01,0.18419840335845947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,32,power_law_1.01,0.18422399759292601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,32,power_law_1.2,0.18344320058822633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,32,power_law_1.2,0.18347519636154175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,4,balanced,0.0888426701227824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,4,balanced,0.08948799967765808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,4,power_law_1.01,0.24412798881530762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,4,power_law_1.01,0.24654080867767333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,4,power_law_1.2,0.24564480781555176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,4,power_law_1.2,0.24737279415130614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,64,balanced,0.05061866839726766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,64,balanced,0.05197866757710775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,64,power_law_1.01,0.1056447982788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,64,power_law_1.01,0.10725120306015015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,64,power_law_1.2,0.10614399909973145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,64,power_law_1.2,0.10722559690475464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,8,balanced,0.06435200075308482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,8,balanced,0.06539200246334076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,8,power_law_1.01,0.24677760601043702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,8,power_law_1.01,0.24732160568237305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,8,power_law_1.2,0.2465536117553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,1,8,power_law_1.2,0.24724481105804444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,16,1,balanced,0.050026665131251015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,16,1,balanced,0.051642666260401406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,16,1,power_law_1.01,0.046489599347114566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,16,1,power_law_1.01,0.04753279983997345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,16,1,power_law_1.2,0.047193598747253415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,16,1,power_law_1.2,0.047660800814628604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,2,1,balanced,0.1452906628449758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,2,1,balanced,0.1509866714477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,2,1,power_law_1.01,0.14351999759674072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,2,1,power_law_1.01,0.14687999486923217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,2,1,power_law_1.2,0.1483456015586853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,2,1,power_law_1.2,0.14840320348739625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,32,1,balanced,0.045567999283472695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,32,1,balanced,0.047509332497914634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,32,1,power_law_1.01,0.04447360038757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,32,1,power_law_1.01,0.04481280148029328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,32,1,power_law_1.2,0.04430719912052154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,32,1,power_law_1.2,0.044588801264762876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,4,1,balanced,0.0798773318529129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,4,1,balanced,0.085807998975118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,4,1,power_law_1.01,0.07874559760093688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,4,1,power_law_1.01,0.07909119725227357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,4,1,power_law_1.2,0.0785215973854065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,4,1,power_law_1.2,0.0789247989654541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,8,1,balanced,0.05779199798901876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,8,1,balanced,0.05806933343410492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,8,1,power_law_1.01,0.05607039928436279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,8,1,power_law_1.01,0.05656319856643677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,8,1,power_law_1.2,0.05594879984855652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2,7168,2048,8,384,8,1,power_law_1.2,0.05601919889450073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,1,balanced,0.34832000732421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,1,balanced,0.3543519973754883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,1,power_law_1.01,0.4033792018890381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,1,power_law_1.01,0.41018238067626955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,1,power_law_1.2,0.4219967842102051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,1,power_law_1.2,0.42213759422302244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,128,balanced,0.13009599844614664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,128,balanced,0.13040533661842346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,128,power_law_1.01,0.13494399785995484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,128,power_law_1.01,0.13574399948120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,128,power_law_1.2,0.14191999435424804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,128,power_law_1.2,0.14343680143356324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,16,balanced,0.1418826679388682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,16,balanced,0.14221333463986716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,16,power_law_1.01,0.16371840238571167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,16,power_law_1.01,0.16684160232543946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,16,power_law_1.2,0.16784000396728516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,16,power_law_1.2,0.16794240474700928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,2,balanced,0.2531893253326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,2,balanced,0.25723199049631756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,2,power_law_1.01,0.3105407953262329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,2,power_law_1.01,0.31129601001739504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,2,power_law_1.2,0.3138240098953247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,2,power_law_1.2,0.32709760665893556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,32,balanced,0.13454932967821756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,32,balanced,0.1357919971148173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,32,power_law_1.01,0.14425599575042725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,32,power_law_1.01,0.14568320512771607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,32,power_law_1.2,0.15134079456329347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,32,power_law_1.2,0.15534720420837403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,4,balanced,0.1930239995320638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,4,balanced,0.19498133659362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,4,power_law_1.01,0.22604799270629883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,4,power_law_1.01,0.22821760177612305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,4,power_law_1.2,0.22987520694732666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,4,power_law_1.2,0.23104639053344728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,64,balanced,0.1316373348236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,64,balanced,0.13354133566220602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,64,power_law_1.01,0.1394047975540161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,64,power_law_1.01,0.14112639427185059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,64,power_law_1.2,0.14504319429397583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,64,power_law_1.2,0.14840320348739625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,8,balanced,0.1605226695537567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,8,balanced,0.16098666191101074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,8,power_law_1.01,0.18703999519348144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,8,power_law_1.01,0.1892351984977722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,8,power_law_1.2,0.1869312047958374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,1,8,power_law_1.2,0.18978559970855713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,2,1,balanced,0.22526933749516806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,2,1,balanced,0.2259999910990397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,2,1,power_law_1.01,0.2764672040939331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,2,1,power_law_1.01,0.2769984006881714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,2,1,power_law_1.2,0.2803263902664185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,2,1,power_law_1.2,0.28129279613494873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,4,1,balanced,0.171999990940094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,4,1,balanced,0.17215466499328613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,4,1,power_law_1.01,0.20458879470825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,4,1,power_law_1.01,0.20492160320281982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,4,1,power_law_1.2,0.20615038871765137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2048,768,8,128,4,1,power_law_1.2,0.20682239532470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,1,balanced,0.8195839722951254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,1,balanced,0.8311466375986735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,1,power_law_1.01,0.9415679931640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,1,power_law_1.01,0.9610560417175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,1,power_law_1.2,0.9626560211181641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,1,power_law_1.2,0.9785152435302734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,128,balanced,0.16922134160995483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,128,balanced,0.17004267374674478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,128,power_law_1.01,0.18376319408416747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,128,power_law_1.01,0.18635519742965698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,128,power_law_1.2,0.20245120525360108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,128,power_law_1.2,0.20527999401092528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,16,balanced,0.2116426626841227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,16,balanced,0.21182932456334433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,16,power_law_1.01,0.24615681171417236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,16,power_law_1.01,0.25233919620513917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,16,power_law_1.2,0.2610879898071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,16,power_law_1.2,0.26127359867095945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,2,balanced,0.5261546770731608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,2,balanced,0.5298080046971639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,2,power_law_1.01,0.6314303874969482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,2,power_law_1.01,0.6337024211883545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,2,power_law_1.2,0.6315328121185303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,2,power_law_1.2,0.6509952068328857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,32,balanced,0.18889600038528442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,32,balanced,0.18925867478052774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,32,power_law_1.01,0.2202239990234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,32,power_law_1.01,0.22104959487915038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,32,power_law_1.2,0.22923519611358642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,32,power_law_1.2,0.23075199127197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,4,balanced,0.35546668370564777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,4,balanced,0.35717864831288654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,4,power_law_1.01,0.4144256114959717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,4,power_law_1.01,0.4178431987762451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,4,power_law_1.2,0.41742720603942873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,4,power_law_1.2,0.4287680149078369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,64,balanced,0.1747573415438334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,64,balanced,0.1750453313191732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,64,power_law_1.01,0.19710079431533814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,64,power_law_1.01,0.19831680059432982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,64,power_law_1.2,0.21458559036254882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,64,power_law_1.2,0.21552000045776368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,8,balanced,0.26234134038289386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,8,balanced,0.26472000281016034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,8,power_law_1.01,0.30935680866241455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,8,power_law_1.01,0.30951039791107177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,8,power_law_1.2,0.32312960624694825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,1,8,power_law_1.2,0.32911999225616456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,16,1,balanced,0.3142346739768982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,16,1,balanced,0.31513599554697674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,16,1,power_law_1.01,0.4059648036956787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,16,1,power_law_1.01,0.4089983940124512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,16,1,power_law_1.2,0.41784958839416503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,16,1,power_law_1.2,0.4182271957397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,2,1,balanced,0.49245866139729816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,2,1,balanced,0.4927146832148234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,2,1,power_law_1.01,0.5833536148071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,2,1,power_law_1.01,0.5886784076690674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,2,1,power_law_1.2,0.6016767978668213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,2,1,power_law_1.2,0.6040512084960937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,32,1,balanced,0.25813867648442584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,32,1,balanced,0.25890133778254193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,32,1,power_law_1.01,0.33965439796447755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,32,1,power_law_1.01,0.33973119258880613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,32,1,power_law_1.2,0.34897279739379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,32,1,power_law_1.2,0.35053439140319825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,4,1,balanced,0.31247466802597046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,4,1,balanced,0.31353066364924115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,4,1,power_law_1.01,0.3694400072097778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,4,1,power_law_1.01,0.3745151996612549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,4,1,power_law_1.2,0.37966079711914064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,4,1,power_law_1.2,0.3830080032348633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,8,1,balanced,0.40863998730977374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,8,1,balanced,0.4096693197886149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,8,1,power_law_1.01,0.5176127910614013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,8,1,power_law_1.01,0.525593614578247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,8,1,power_law_1.2,0.5362304210662842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,2688,1856,6,128,8,1,power_law_1.2,0.5371967792510987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,1,balanced,1.526576042175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,1,balanced,1.5367786089579265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,1,power_law_1.01,1.613203239440918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,1,power_law_1.01,1.6159360885620118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,1,power_law_1.2,1.6732032775878907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,1,power_law_1.2,1.701420783996582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,128,balanced,0.22977600495020548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,128,balanced,0.23113600413004556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,128,power_law_1.01,0.2399679899215698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,128,power_law_1.01,0.2436288118362427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,128,power_law_1.2,0.2503040075302124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,128,power_law_1.2,0.2534271955490112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,16,balanced,0.30483200152715045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,16,balanced,0.30502933263778687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,16,power_law_1.01,0.33086719512939455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,16,power_law_1.01,0.33804800510406496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,16,power_law_1.2,0.3450047969818115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,16,power_law_1.2,0.34524800777435305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,2,balanced,0.8699999650319418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,2,balanced,0.8726452986399332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,2,power_law_1.01,0.9417856216430665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,2,power_law_1.01,0.9492671966552735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,2,power_law_1.2,0.9738816261291504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,2,power_law_1.2,0.980735969543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,256,balanced,0.22660799821217856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,256,balanced,0.2280693252881368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,256,power_law_1.01,0.2352384090423584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,256,power_law_1.01,0.2356031894683838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,256,power_law_1.2,0.244979190826416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,256,power_law_1.2,0.2475584030151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,32,balanced,0.2585279941558838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,32,balanced,0.2595679958661397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,32,power_law_1.01,0.28096001148223876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,32,power_law_1.01,0.2830336093902588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,32,power_law_1.2,0.2910527944564819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,32,power_law_1.2,0.29823999404907225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,4,balanced,0.5525333484013876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,4,balanced,0.5532106558481852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,4,power_law_1.01,0.5983551979064942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,4,power_law_1.01,0.6207168102264404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,4,power_law_1.2,0.603334379196167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,4,power_law_1.2,0.616051197052002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,64,balanced,0.23824532826741537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,64,balanced,0.23825067281723022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,64,power_law_1.01,0.25474560260772705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,64,power_law_1.01,0.2586944103240967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,64,power_law_1.2,0.26519041061401366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,64,power_law_1.2,0.27491838932037355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,8,balanced,0.38731201489766437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,8,balanced,0.3874826828638713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,8,power_law_1.01,0.42011518478393556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,8,power_law_1.01,0.4282559871673584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,8,power_law_1.2,0.44313597679138184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,1,8,power_law_1.2,0.44858241081237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,16,1,balanced,0.2717866698900859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,16,1,balanced,0.273418664932251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,16,1,power_law_1.01,0.3091327905654907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,16,1,power_law_1.01,0.3093055963516235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,16,1,power_law_1.2,0.31587839126586914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,16,1,power_law_1.2,0.3185920000076294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,2,1,balanced,0.8330826759338379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,2,1,balanced,0.8333973089853922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,2,1,power_law_1.01,0.8909055709838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,2,1,power_law_1.01,0.8949952125549316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,2,1,power_law_1.2,0.9321855545043946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,2,1,power_law_1.2,0.940556812286377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,32,1,balanced,0.22197866439819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,32,1,balanced,0.22394667069117227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,32,1,power_law_1.01,0.25770881175994875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,32,1,power_law_1.01,0.25829119682312013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,32,1,power_law_1.2,0.2636607885360718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,32,1,power_law_1.2,0.2645632028579712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,4,1,balanced,0.5034613211949667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,4,1,balanced,0.5034826596577963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,4,1,power_law_1.01,0.5396927833557129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,4,1,power_law_1.01,0.5465023994445801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,4,1,power_law_1.2,0.5537792205810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,4,1,power_law_1.2,0.5567232131958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,8,1,balanced,0.3391306797663371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,8,1,balanced,0.3403253157933553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,8,1,power_law_1.01,0.37521278858184814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,8,1,power_law_1.01,0.37637760639190676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,8,1,power_law_1.2,0.3825792074203491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,3072,1536,8,256,8,1,power_law_1.2,0.38330879211425783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,1,balanced,1.7135200500488281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,1,balanced,1.7263092994689941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,1,power_law_1.01,1.8904064178466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,1,power_law_1.01,1.9027839660644532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,1,power_law_1.2,1.8993152618408202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,1,power_law_1.2,1.9320192337036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,2,balanced,0.9794293244679769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,2,balanced,0.9843200047810873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,2,power_law_1.01,1.3369088172912598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,2,power_law_1.01,1.3421631813049317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,2,power_law_1.2,1.3773568153381348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,2,power_law_1.2,1.5757247924804687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,4,balanced,0.5962133407592773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,4,balanced,0.5973493258158366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,4,power_law_1.01,1.0076671600341798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,4,power_law_1.01,1.0115327835083008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,4,power_law_1.2,0.9811264038085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,4,power_law_1.2,1.0561087608337403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,8,balanced,0.46650667985280353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,8,balanced,0.4681226809819539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,8,power_law_1.01,0.8577407836914063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,8,power_law_1.01,0.8725184440612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,8,power_law_1.2,0.8736448287963867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,1,8,power_law_1.2,0.8914688110351563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,16,1,balanced,0.17087999979654947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,16,1,balanced,0.17099199692408243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,16,1,power_law_1.01,0.1798143982887268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,16,1,power_law_1.01,0.17991679906845093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,16,1,power_law_1.2,0.17723519802093507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,16,1,power_law_1.2,0.17791359424591063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,2,1,balanced,0.8829066753387451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,2,1,balanced,0.8929119904836019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,2,1,power_law_1.01,0.9537152290344239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,2,1,power_law_1.01,0.961894416809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,2,1,power_law_1.2,0.952121639251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,2,1,power_law_1.2,0.9585727691650391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,32,1,balanced,0.11338133613268535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,32,1,balanced,0.11539733409881592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,32,1,power_law_1.01,0.12077440023422241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,32,1,power_law_1.01,0.1211840033531189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,32,1,power_law_1.2,0.12003200054168701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,32,1,power_law_1.2,0.12031359672546386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,4,1,balanced,0.474181334177653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,4,1,balanced,0.4752693176269531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,4,1,power_law_1.01,0.5081088066101074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,4,1,power_law_1.01,0.5153855800628662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,4,1,power_law_1.2,0.5003327846527099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,4,1,power_law_1.2,0.5157695770263672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,8,1,balanced,0.2799573342005412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,8,1,balanced,0.28034132719039917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,8,1,power_law_1.01,0.28574719429016116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,8,1,power_law_1.01,0.2865664005279541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,8,1,power_law_1.2,0.286681604385376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,14336,2,8,8,1,power_law_1.2,0.2880000114440918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,1,balanced,1.1013333002726238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,1,balanced,1.1056586901346843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,1,power_law_1.01,1.4332544326782226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,1,power_law_1.01,1.434995174407959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,1,power_law_1.2,1.461855983734131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,1,power_law_1.2,1.4866175651550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,128,balanced,0.2276159922281901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,128,balanced,0.22778666019439697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,128,power_law_1.01,0.25473918914794924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,128,power_law_1.01,0.25861120223999023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,128,power_law_1.2,0.2728640079498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,128,power_law_1.2,0.27730560302734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,16,balanced,0.2680906653404236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,16,balanced,0.2701333363850911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,16,power_law_1.01,0.3338239908218384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,16,power_law_1.01,0.3387200117111206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,16,power_law_1.2,0.3522432088851929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,16,power_law_1.2,0.36659200191497804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,2,balanced,0.6777119636535645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,2,balanced,0.6782879829406738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,2,power_law_1.01,0.8585280418395996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,2,power_law_1.01,0.8816448211669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,2,power_law_1.2,0.876153564453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,2,power_law_1.2,0.9074175834655762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,32,balanced,0.24020800987879434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,32,balanced,0.2408533294995626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,32,power_law_1.01,0.2875328063964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,32,power_law_1.01,0.297760009765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,32,power_law_1.2,0.3075648069381714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,32,power_law_1.2,0.3158207893371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,4,balanced,0.4399413267771403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,4,balanced,0.44121599197387695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,4,power_law_1.01,0.5660096168518066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,4,power_law_1.01,0.5671487808227539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,4,power_law_1.2,0.5684415817260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,4,power_law_1.2,0.5806655883789062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,64,balanced,0.23047999540964761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,64,balanced,0.23169066508611044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,64,power_law_1.01,0.2658047914505005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,64,power_law_1.01,0.2707135915756226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,64,power_law_1.2,0.28758399486541747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,64,power_law_1.2,0.30261759757995604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,8,balanced,0.32874133189519245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,8,balanced,0.3299413323402405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,8,power_law_1.01,0.41069440841674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,8,power_law_1.01,0.41863040924072265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,8,power_law_1.2,0.422438383102417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,1,8,power_law_1.2,0.4449471950531006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,16,1,balanced,0.23570134242375693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,16,1,balanced,0.23583465814590454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,16,1,power_law_1.01,0.29747838973999025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,16,1,power_law_1.01,0.29821441173553465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,16,1,power_law_1.2,0.29959681034088137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,16,1,power_law_1.2,0.30071680545806884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,2,1,balanced,0.6149280071258545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,2,1,balanced,0.6205120086669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,2,1,power_law_1.01,0.7298687934875489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,2,1,power_law_1.01,0.735206413269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,2,1,power_law_1.2,0.7565248012542725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,2,1,power_law_1.2,0.7640063762664795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,32,1,balanced,0.21549866596857706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,32,1,balanced,0.2155146598815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,32,1,power_law_1.01,0.24414079189300536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,32,1,power_law_1.01,0.24456961154937745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,32,1,power_law_1.2,0.2460927963256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,32,1,power_law_1.2,0.2462399959564209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,4,1,balanced,0.3935733238855998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,4,1,balanced,0.39500800768534344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,4,1,power_law_1.01,0.4979392051696777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,4,1,power_law_1.01,0.4979712009429932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,4,1,power_law_1.2,0.5008255958557128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,4,1,power_law_1.2,0.5028031826019287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,8,1,balanced,0.2972746690114339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,8,1,balanced,0.2980960011482239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,8,1,power_law_1.01,0.35904641151428224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,8,1,power_law_1.01,0.3609855890274048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,8,1,power_law_1.2,0.36135039329528806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,1536,8,128,8,1,power_law_1.2,0.36387200355529786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,1,balanced,7.166090647379558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,1,balanced,7.264154434204102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,1,power_law_1.01,8.978163146972657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,1,power_law_1.01,9.173343658447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,1,power_law_1.2,9.207283020019531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,1,power_law_1.2,9.327603149414063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,128,balanced,0.8152000109354655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,128,balanced,0.8170506954193115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,128,power_law_1.01,0.892147159576416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,128,power_law_1.01,0.8933952331542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,128,power_law_1.2,0.9101759910583496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,128,power_law_1.2,0.9197183609008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,16,balanced,1.1485599676767986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,16,balanced,1.1521813074747722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,16,power_law_1.01,1.318835163116455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,16,power_law_1.01,1.3310720443725585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,16,power_law_1.2,1.3782912254333497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,16,power_law_1.2,1.387993621826172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,2,balanced,3.9350932439168296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,2,balanced,4.148912111918132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,2,power_law_1.01,4.873222351074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,2,power_law_1.01,4.882963180541992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,2,power_law_1.2,4.898950576782227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,2,power_law_1.2,5.208569717407227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,256,balanced,0.7974507013956705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,256,balanced,0.7981226444244385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,256,power_law_1.01,0.8525888442993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,256,power_law_1.01,0.8576128005981445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,256,power_law_1.2,0.880339241027832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,256,power_law_1.2,0.884825611114502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,32,balanced,0.9654293060302734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,32,balanced,0.9658026695251465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,32,power_law_1.01,1.0793024063110352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,32,power_law_1.01,1.087712001800537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,32,power_law_1.2,1.1178879737854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,32,power_law_1.2,1.1248127937316894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,4,balanced,2.3023200035095215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,4,balanced,2.3187360763549805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,4,power_law_1.01,2.7435712814331055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,4,power_law_1.01,2.8483903884887694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,4,power_law_1.2,2.824640083312988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,4,power_law_1.2,2.8389631271362306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,64,balanced,0.870581309000651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,64,balanced,0.8717652956644694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,64,power_law_1.01,0.9529919624328613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,64,power_law_1.01,0.958124828338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,64,power_law_1.2,0.9842047691345215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,64,power_law_1.2,0.985536003112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,8,balanced,1.5411094029744465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,8,balanced,1.5418240229288738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,8,power_law_1.01,1.7994047164916993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,8,power_law_1.01,1.8287168502807618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,8,power_law_1.2,1.8612543106079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,1,8,power_law_1.2,1.8714815139770509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,16,1,balanced,1.8555466334025066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,16,1,balanced,1.8594719568888347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,16,1,power_law_1.01,2.3473663330078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,16,1,power_law_1.01,2.3596799850463865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,16,1,power_law_1.2,2.4199743270874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,16,1,power_law_1.2,2.429977607727051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,2,1,balanced,3.425029436747233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,2,1,balanced,3.458751996358236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,2,1,power_law_1.01,3.923455810546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,2,1,power_law_1.01,4.031558227539063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,2,1,power_law_1.2,4.055705642700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,2,1,power_law_1.2,4.163980865478516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,32,1,balanced,1.5710773468017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,32,1,balanced,1.5718666712443035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,32,1,power_law_1.01,2.0520256042480467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,32,1,power_law_1.01,2.068012809753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,32,1,power_law_1.2,2.12938232421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,32,1,power_law_1.2,2.1298112869262695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,4,1,balanced,4.897034645080566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,4,1,balanced,4.961839993794759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,4,1,power_law_1.01,4.661478424072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,4,1,power_law_1.01,4.7146240234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,4,1,power_law_1.2,4.696268844604492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,4,1,power_law_1.2,4.781273651123047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,8,1,balanced,1.2905866305033367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,8,1,balanced,1.2907360394795735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,8,1,power_law_1.01,1.5025471687316894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,8,1,power_law_1.01,1.51146240234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,8,1,power_law_1.2,1.5607872009277344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,4096,2688,22,512,8,1,power_law_1.2,1.5614848136901855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,1,balanced,2.8994134267171225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,1,balanced,3.0800374348958335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,1,power_law_1.01,3.137433624267578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,1,power_law_1.01,3.1819520950317384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,1,power_law_1.2,3.0099456787109373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,1,power_law_1.2,3.21212158203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,2,balanced,1.5558346112569172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,2,balanced,1.639909267425537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,2,power_law_1.01,2.0863487243652346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,2,power_law_1.01,2.1737600326538087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,2,power_law_1.2,1.981760025024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,2,power_law_1.2,2.327372741699219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,4,balanced,0.9384000301361084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,4,balanced,0.9424853324890137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,4,power_law_1.01,1.5260607719421386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,4,power_law_1.01,1.8280128479003905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,4,power_law_1.2,1.5368255615234374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,4,power_law_1.2,1.666534423828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,8,balanced,0.6002346674601237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,8,balanced,0.6018186807632446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,8,power_law_1.01,1.387615966796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,8,power_law_1.01,1.3995136260986327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,8,power_law_1.2,1.3846847534179687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,1,8,power_law_1.2,1.3910271644592285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,16,1,balanced,0.24683199326197305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,16,1,balanced,0.24685333172480264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,16,1,power_law_1.01,0.25759360790252683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,16,1,power_law_1.01,0.275929594039917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,16,1,power_law_1.2,0.2594559907913208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,16,1,power_law_1.2,0.27036800384521487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,2,1,balanced,1.45634126663208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,2,1,balanced,1.4721760749816895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,2,1,power_law_1.01,1.5693696022033692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,2,1,power_law_1.01,1.5730815887451173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,2,1,power_law_1.2,1.563430404663086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,2,1,power_law_1.2,1.5701567649841308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,32,1,balanced,0.16198933124542236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,32,1,balanced,0.1623360017935435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,32,1,power_law_1.01,0.16940159797668458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,32,1,power_law_1.01,0.17957760095596315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,32,1,power_law_1.2,0.17134079933166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,32,1,power_law_1.2,0.17564159631729126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,4,1,balanced,0.7400533358256022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,4,1,balanced,0.7572960058848063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,4,1,power_law_1.01,0.8045439720153809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,4,1,power_law_1.01,0.8320832252502441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,4,1,power_law_1.2,0.8133248329162598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,4,1,power_law_1.2,0.8288000106811524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,8,1,balanced,0.4140213330586751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,8,1,balanced,0.41730133692423504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,8,1,power_law_1.01,0.44467840194702146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,8,1,power_law_1.01,0.4460159778594971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,8,1,power_law_1.2,0.4398399829864502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,16384,2,8,8,1,power_law_1.2,0.44153599739074706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,1,balanced,3.872250556945801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,1,balanced,4.009946823120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,1,power_law_1.01,4.3102783203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,1,power_law_1.01,4.371072006225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,1,power_law_1.2,4.4979713439941404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,1,power_law_1.2,4.656089782714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,128,balanced,0.37012267112731934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,128,balanced,0.37061866124471027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,128,power_law_1.01,0.4077184200286865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,128,power_law_1.01,0.4123136043548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,128,power_law_1.2,0.4207359790802002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,128,power_law_1.2,0.4219264030456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,16,balanced,0.5570400158564249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,16,balanced,0.5583306550979614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,16,power_law_1.01,0.6253695964813233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,16,power_law_1.01,0.6261631965637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,16,power_law_1.2,0.6462207794189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,16,power_law_1.2,0.6716288089752197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,2,balanced,2.1198827425638833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,2,balanced,2.189199924468994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,2,power_law_1.01,2.3165376663208006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,2,power_law_1.01,2.3457279205322266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,2,power_law_1.2,2.410758399963379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,2,power_law_1.2,2.448748779296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,256,balanced,0.3617173433303833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,256,balanced,0.36353600025177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,256,power_law_1.01,0.3845952033996582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,256,power_law_1.01,0.386847996711731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,256,power_law_1.2,0.40435199737548827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,256,power_law_1.2,0.4164415836334229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,32,balanced,0.45129064718882245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,32,balanced,0.4517279863357544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,32,power_law_1.01,0.4989312171936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,32,power_law_1.01,0.49898881912231446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,32,power_law_1.2,0.5176767826080322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,32,power_law_1.2,0.5385407924652099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,4,balanced,1.1933973630269368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,4,balanced,1.215557336807251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,4,power_law_1.01,1.3368767738342284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,4,power_law_1.01,1.3447168350219727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,4,power_law_1.2,1.3836223602294921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,4,power_law_1.2,1.439468765258789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,64,balanced,0.39236267407735187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,64,balanced,0.39321601390838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,64,power_law_1.01,0.4465151786804199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,64,power_law_1.01,0.4490367889404297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,64,power_law_1.2,0.4594880104064941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,64,power_law_1.2,0.46091518402099607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,8,balanced,0.7682507038116455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,8,balanced,0.7698293526967367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,8,power_law_1.01,0.8682687759399415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,8,power_law_1.01,0.871776008605957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,8,power_law_1.2,0.8624959945678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,1,8,power_law_1.2,0.9275199890136718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,16,1,balanced,0.509061336517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,16,1,balanced,0.5103040138880411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,16,1,power_law_1.01,0.5798592090606689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,16,1,power_law_1.01,0.5842688083648682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,16,1,power_law_1.2,0.5915328025817871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,16,1,power_law_1.2,0.5924736022949219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,2,1,balanced,2.042912006378174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,2,1,balanced,2.060863971710205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,2,1,power_law_1.01,2.1698688507080077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,2,1,power_law_1.01,2.1744831085205076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,2,1,power_law_1.2,2.2303871154785155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,2,1,power_law_1.2,2.4070528030395506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,32,1,balanced,0.406879981358846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,32,1,balanced,0.41038934389750165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,32,1,power_law_1.01,0.4744256019592285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,32,1,power_law_1.01,0.47583999633789065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,32,1,power_law_1.2,0.48613758087158204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,32,1,power_law_1.2,0.48842878341674806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,4,1,balanced,1.1200106938680012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,4,1,balanced,1.1373546918233235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,4,1,power_law_1.01,1.2239359855651855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,4,1,power_law_1.01,1.2244735717773438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,4,1,power_law_1.2,1.2803711891174316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,4,1,power_law_1.2,1.283891201019287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,8,1,balanced,0.7189386685689291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,8,1,balanced,0.7197173436482748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,8,1,power_law_1.01,0.7867263793945313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,8,1,power_law_1.01,0.7908415794372559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,8,1,power_law_1.2,0.8071743965148925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2048,8,256,8,1,power_law_1.2,0.8084927558898926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,1,balanced,3.1512374877929688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,1,balanced,3.1794398625691733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,1,power_law_1.01,4.062707138061524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,1,power_law_1.01,4.192582321166992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,1,power_law_1.2,4.2031806945800785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,1,power_law_1.2,4.374854278564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,16,balanced,0.49790934721628827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,16,balanced,0.49848000208536786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,16,power_law_1.01,0.6181375980377197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,16,power_law_1.01,0.634822416305542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,16,power_law_1.2,0.6678912162780761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,16,power_law_1.2,0.6727359771728516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,2,balanced,1.7392160097757976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,2,balanced,1.7584692637125652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,2,power_law_1.01,2.1501760482788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,2,power_law_1.01,2.194566345214844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,2,power_law_1.2,2.1986560821533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,2,power_law_1.2,2.2715007781982424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,32,balanced,0.4100106557210286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,32,balanced,0.41147732734680176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,32,power_law_1.01,0.5060480117797852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,32,power_law_1.01,0.5187903881072998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,32,power_law_1.2,0.5416384220123291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,32,power_law_1.2,0.5676415920257568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,4,balanced,1.0064106782277424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,4,balanced,1.0079306761423747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,4,power_law_1.01,1.2850624084472657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,4,power_law_1.01,1.3214271545410157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,4,power_law_1.2,1.341222381591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,4,power_law_1.2,1.3528639793395996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,8,balanced,0.667685349782308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,8,balanced,0.6677707036336263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,8,power_law_1.01,0.8329536437988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,8,power_law_1.01,0.861574363708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,8,power_law_1.2,0.8641087532043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,1,8,power_law_1.2,0.9082495689392089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,16,1,balanced,0.4379359881083171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,16,1,balanced,0.43957332770029706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,16,1,power_law_1.01,0.530406379699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,16,1,power_law_1.01,0.5305727958679199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,16,1,power_law_1.2,0.5364160060882568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,16,1,power_law_1.2,0.5365695953369141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,2,1,balanced,1.641599973042806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,2,1,balanced,1.6479040781656902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,2,1,power_law_1.01,1.9932992935180665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,2,1,power_law_1.01,2.0666175842285157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,2,1,power_law_1.2,2.061471939086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,2,1,power_law_1.2,2.0772607803344725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,32,1,balanced,0.39477332433064777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,32,1,balanced,0.3951306740442912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,32,1,power_law_1.01,0.442137622833252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,32,1,power_law_1.01,0.4425983905792236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,32,1,power_law_1.2,0.4456639766693115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,32,1,power_law_1.2,0.4496767997741699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,4,1,balanced,0.9384053548177084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,4,1,balanced,0.947983980178833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,4,1,power_law_1.01,1.1386816024780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,4,1,power_law_1.01,1.1395456314086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,4,1,power_law_1.2,1.1537728309631348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,4,1,power_law_1.2,1.1673727989196778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,8,1,balanced,0.5782080094019572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,8,1,balanced,0.5792160034179688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,8,1,power_law_1.01,0.7174592018127441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,8,1,power_law_1.01,0.7226367950439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,8,1,power_law_1.2,0.730463981628418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,6144,2560,8,160,8,1,power_law_1.2,0.7307392120361328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,1,balanced,4.515242576599121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,1,balanced,4.563551902770996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,1,power_law_1.01,4.867884826660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,1,power_law_1.01,4.948428726196289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,1,power_law_1.2,5.247404861450195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,1,power_law_1.2,5.404563140869141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,128,balanced,0.40651198228200275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,128,balanced,0.40719465414683026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,128,power_law_1.01,0.44773120880126954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,128,power_law_1.01,0.4537536144256592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,128,power_law_1.2,0.47405438423156737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,128,power_law_1.2,0.4807295799255371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,16,balanced,0.6275999943415324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,16,balanced,0.6290880044301351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,16,power_law_1.01,0.7080448150634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,16,power_law_1.01,0.7160704135894775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,16,power_law_1.2,0.7253824234008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,16,power_law_1.2,0.7543360233306885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,2,balanced,2.58897066116333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,2,balanced,2.6709280014038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,2,power_law_1.01,2.631315231323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,2,power_law_1.01,2.676268768310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,2,power_law_1.2,2.783296012878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,2,power_law_1.2,2.7980415344238283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,256,balanced,0.3982613484064738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,256,balanced,0.3991359869639079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,256,power_law_1.01,0.4246784210205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,256,power_law_1.01,0.42876157760620115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,256,power_law_1.2,0.45525760650634767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,256,power_law_1.2,0.46048641204833984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,32,balanced,0.5011253356933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,32,balanced,0.5020426511764526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,32,power_law_1.01,0.554643201828003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,32,power_law_1.01,0.560652780532837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,32,power_law_1.2,0.583193588256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,32,power_law_1.2,0.5842048168182373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,4,balanced,1.3805920282999675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,4,balanced,1.3823466300964355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,4,power_law_1.01,1.5381695747375488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,4,power_law_1.01,1.548192024230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,4,power_law_1.2,1.5419136047363282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,4,power_law_1.2,1.5528063774108887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,64,balanced,0.43356800079345703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,64,balanced,0.43503467241923016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,64,power_law_1.01,0.4917312145233154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,64,power_law_1.01,0.49377918243408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,64,power_law_1.2,0.50797438621521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,64,power_law_1.2,0.5251967906951904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,8,balanced,0.8728693326314291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,8,balanced,0.8756799697875977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,8,power_law_1.01,0.9814208030700684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,8,power_law_1.01,0.9947711944580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,8,power_law_1.2,1.022099208831787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,1,8,power_law_1.2,1.0447168350219727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,16,1,balanced,0.5883520046869913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,16,1,balanced,0.5888533194859823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,16,1,power_law_1.01,0.6691328048706054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,16,1,power_law_1.01,0.672819185256958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,16,1,power_law_1.2,0.6821951866149902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,16,1,power_law_1.2,0.6885248184204101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,2,1,balanced,2.3334827423095703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,2,1,balanced,2.4575146039326987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,2,1,power_law_1.01,2.4999231338500976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,2,1,power_law_1.01,2.519264030456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,2,1,power_law_1.2,2.70263671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,2,1,power_law_1.2,2.7408447265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,32,1,balanced,0.4676320155461629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,32,1,balanced,0.46906665960947674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,32,1,power_law_1.01,0.5465472221374512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,32,1,power_law_1.01,0.5478847980499267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,32,1,power_law_1.2,0.5580351829528809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,32,1,power_law_1.2,0.5645823955535889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,4,1,balanced,1.2903839747111003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,4,1,balanced,1.3237760066986084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,4,1,power_law_1.01,1.4116864204406738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,4,1,power_law_1.01,1.4386303901672364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,4,1,power_law_1.2,1.481651210784912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,4,1,power_law_1.2,1.4822336196899415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,8,1,balanced,0.8339146773020426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,8,1,balanced,0.8360053698221842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,8,1,power_law_1.01,0.919372844696045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,8,1,power_law_1.01,0.9225664138793945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,8,1,power_law_1.2,0.937337589263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,256,8,1,power_law_1.2,0.9406975746154785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,1,balanced,6.751466751098633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,1,balanced,6.898426691691081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,1,power_law_1.01,6.510387420654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,1,power_law_1.01,6.525260925292969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,1,power_law_1.2,7.109945678710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,1,power_law_1.2,7.231353759765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,128,balanced,0.4774186611175537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,128,balanced,0.477946678797404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,128,power_law_1.01,0.5037312030792236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,128,power_law_1.01,0.5113279819488525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,128,power_law_1.2,0.5262400150299072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,128,power_law_1.2,0.5267648220062255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,16,balanced,0.8015626271565756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,16,balanced,0.8036320209503174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,16,power_law_1.01,0.8503359794616699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,16,power_law_1.01,0.8692992210388184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,16,power_law_1.2,0.85731201171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,16,power_law_1.2,0.8801088333129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,2,balanced,3.4928693771362305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,2,balanced,3.737717310587565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,2,power_law_1.01,3.457478332519531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,2,power_law_1.01,3.4974910736083986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,2,power_law_1.2,3.548761749267578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,2,power_law_1.2,3.6942657470703124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,32,balanced,0.6226133505503336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,32,balanced,0.6239413420359293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,32,power_law_1.01,0.6425280094146728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,32,power_law_1.01,0.664083194732666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,32,power_law_1.2,0.6924928188323974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,32,power_law_1.2,0.7035967826843261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,4,balanced,1.9129707018534343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,4,balanced,1.9188906351725261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,4,power_law_1.01,1.8555967330932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,4,power_law_1.01,1.8992895126342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,4,power_law_1.2,2.0448320388793944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,4,power_law_1.2,2.055059242248535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,64,balanced,0.5218666791915894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,64,balanced,0.5227146546045939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,64,power_law_1.01,0.5668992042541504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,64,power_law_1.01,0.5689023971557617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,64,power_law_1.2,0.5824639797210693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,64,power_law_1.2,0.5884992122650147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,8,balanced,1.1785173416137695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,8,balanced,1.1815679868062336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,8,power_law_1.01,1.2072256088256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,8,power_law_1.01,1.2232064247131347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,8,power_law_1.2,1.2204095840454101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,1,8,power_law_1.2,1.2589056015014648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,16,1,balanced,0.7956746419270834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,16,1,balanced,0.7988106409708658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,16,1,power_law_1.01,0.7880064010620117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,16,1,power_law_1.01,0.7937215805053711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,16,1,power_law_1.2,0.8092543601989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,16,1,power_law_1.2,0.8117823600769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,2,1,balanced,3.4602133433024087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,2,1,balanced,3.4822667439778647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,2,1,power_law_1.01,3.319660949707031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,2,1,power_law_1.01,3.356524658203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,2,1,power_law_1.2,3.474425506591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,2,1,power_law_1.2,3.5673599243164062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,32,1,balanced,0.6471413373947144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,32,1,balanced,0.6480640172958374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,32,1,power_law_1.01,0.6479551792144775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,32,1,power_law_1.01,0.6487232208251953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,32,1,power_law_1.2,0.6637760162353515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,32,1,power_law_1.2,0.6654784202575683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,4,1,balanced,1.8517386118570964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,4,1,balanced,1.913914680480957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,4,1,power_law_1.01,1.7923904418945313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,4,1,power_law_1.01,1.812883186340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,4,1,power_law_1.2,1.9087104797363281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,4,1,power_law_1.2,1.9197120666503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,8,1,balanced,1.1622933546702068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,8,1,balanced,1.1659680207570393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,8,1,power_law_1.01,1.1424575805664063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,8,1,power_law_1.01,1.1443967819213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,8,1,power_law_1.2,1.1736191749572753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,2048,7168,2048,8,384,8,1,power_law_1.2,1.1811519622802735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,1,balanced,0.21573867400487265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,1,balanced,0.2158986727396647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,1,power_law_1.01,0.2372607946395874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,1,power_law_1.01,0.23836159706115723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,1,power_law_1.2,0.2425152063369751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,1,power_law_1.2,0.24314239025115966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,128,balanced,0.04859200119972229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,128,balanced,0.05072000126043955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,128,power_law_1.01,0.04890879988670349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,128,power_law_1.01,0.05002880096435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,128,power_law_1.2,0.04898560047149658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,128,power_law_1.2,0.04913919866085052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,16,balanced,0.058037335673967995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,16,balanced,0.05921066800753275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,16,power_law_1.01,0.05626239776611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,16,power_law_1.01,0.056505602598190305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,16,power_law_1.2,0.05850239992141724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,16,power_law_1.2,0.058764797449111936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,2,balanced,0.13891200224558511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,2,balanced,0.14289066195487976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,2,power_law_1.01,0.13553279638290405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,2,power_law_1.01,0.1363968014717102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,2,power_law_1.2,0.13660800457000732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,2,power_law_1.2,0.13839999437332154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,32,balanced,0.04994666576385498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,32,balanced,0.0499946673711141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,32,power_law_1.01,0.04831359982490539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,32,power_law_1.01,0.04839679896831513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,32,power_law_1.2,0.04906240105628967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,32,power_law_1.2,0.05066879987716675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,4,balanced,0.09477866689364116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,4,balanced,0.09518399834632874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,4,power_law_1.01,0.09114239811897278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,4,power_law_1.01,0.09293439984321594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,4,power_law_1.2,0.0927295982837677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,4,power_law_1.2,0.09337599873542786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,64,balanced,0.04797866443792979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,64,balanced,0.04867733518282572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,64,power_law_1.01,0.04733439981937408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,64,power_law_1.01,0.04775039851665497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,64,power_law_1.2,0.04754559993743897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,64,power_law_1.2,0.04764159917831421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,8,balanced,0.07005333403746287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,8,balanced,0.07249600191911061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,8,power_law_1.01,0.07039999961853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,8,power_law_1.01,0.0704255998134613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,8,power_law_1.2,0.06964480280876159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,1,8,power_law_1.2,0.07033600211143494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,2,1,balanced,0.13618133465449014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,2,1,balanced,0.13659200072288513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,2,1,power_law_1.01,0.1302847981452942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,2,1,power_law_1.01,0.13098880052566528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,2,1,power_law_1.2,0.13224320411682128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,2,1,power_law_1.2,0.13230719566345214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,4,1,balanced,0.0905013382434845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,4,1,balanced,0.09097066521644592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,4,1,power_law_1.01,0.08710399866104127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,4,1,power_law_1.01,0.0876416027545929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,4,1,power_law_1.2,0.08844159841537476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2048,768,8,128,4,1,power_law_1.2,0.08862720131874084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,1,balanced,0.600272019704183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,1,balanced,0.6027946472167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,1,power_law_1.01,0.6074304103851318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,1,power_law_1.01,0.6075903892517089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,1,power_law_1.2,0.6101759910583496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,1,power_law_1.2,0.6230720043182373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,128,balanced,0.06842133402824402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,128,balanced,0.06864533325036366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,128,power_law_1.01,0.06774399876594543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,128,power_law_1.01,0.06846719980239868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,128,power_law_1.2,0.06933760046958923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,128,power_law_1.2,0.0694208025932312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,16,balanced,0.08895466725031535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,16,balanced,0.09032000104586284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,16,power_law_1.01,0.08760960102081299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,16,power_law_1.01,0.08805760145187377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,16,power_law_1.2,0.08886399865150452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,16,power_law_1.2,0.08904320001602173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,2,balanced,0.3621866703033447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,2,balanced,0.36872533957163495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,2,power_law_1.01,0.3295936107635498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,2,power_law_1.01,0.34472320079803465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,2,power_law_1.2,0.3475071907043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,2,power_law_1.2,0.35688319206237795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,32,balanced,0.07832533121109009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,32,balanced,0.07933866480986278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,32,power_law_1.01,0.07603840231895446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,32,power_law_1.01,0.07604479789733887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,32,power_law_1.2,0.07793920040130616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,32,power_law_1.2,0.07822080254554749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,4,balanced,0.21319466829299927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,4,balanced,0.21411732832590738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,4,power_law_1.01,0.19635839462280275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,4,power_law_1.01,0.19907840490341186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,4,power_law_1.2,0.19786880016326905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,4,power_law_1.2,0.2065664052963257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,64,balanced,0.07028799752394359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,64,balanced,0.0703359991312027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,64,power_law_1.01,0.07141759991645813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,64,power_law_1.01,0.07193599939346314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,64,power_law_1.2,0.07018240094184876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,64,power_law_1.2,0.07174400091171265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,8,balanced,0.13657066226005554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,8,balanced,0.13793067137400308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,8,power_law_1.01,0.1232192039489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,8,power_law_1.01,0.13249919414520264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,8,power_law_1.2,0.13428479433059692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,1,8,power_law_1.2,0.13854080438613892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,16,1,balanced,0.22288533051808676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,16,1,balanced,0.22296533981959024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,16,1,power_law_1.01,0.20801920890808107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,16,1,power_law_1.01,0.2094655990600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,16,1,power_law_1.2,0.21519360542297364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,16,1,power_law_1.2,0.21691520214080812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,2,1,balanced,0.3526560068130493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,2,1,balanced,0.35414401690165204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,2,1,power_law_1.01,0.32751998901367185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,2,1,power_law_1.01,0.33165440559387205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,2,1,power_law_1.2,0.34399359226226806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,2,1,power_law_1.2,0.34708480834960936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,32,1,balanced,0.19090133905410767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,32,1,balanced,0.19129067659378052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,32,1,power_law_1.01,0.1777151942253113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,32,1,power_law_1.01,0.18190079927444458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,32,1,power_law_1.2,0.185862398147583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,32,1,power_law_1.2,0.1862272024154663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,4,1,balanced,0.2092640002568563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,4,1,balanced,0.20973867177963257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,4,1,power_law_1.01,0.197817599773407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,4,1,power_law_1.01,0.19928319454193116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,4,1,power_law_1.2,0.20390400886535645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,4,1,power_law_1.2,0.20511360168457032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,8,1,balanced,0.32497066259384155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,8,1,balanced,0.32602133353551227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,8,1,power_law_1.01,0.30298240184783937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,8,1,power_law_1.01,0.3049216032028198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,8,1,power_law_1.2,0.31371519565582273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,2688,1856,6,128,8,1,power_law_1.2,0.31738240718841554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,1,balanced,1.1723253726959229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,1,balanced,1.189909299214681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,1,power_law_1.01,0.9965888023376465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,1,power_law_1.01,1.0068991661071778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,1,power_law_1.2,1.0094592094421386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,1,power_law_1.2,1.0138879776000977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,128,balanced,0.1027893324693044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,128,balanced,0.10335999727249146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,128,power_law_1.01,0.10058879852294922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,128,power_law_1.01,0.10061440467834473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,128,power_law_1.2,0.10156160593032837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,128,power_law_1.2,0.10202879905700683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,16,balanced,0.1628159979979197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,16,balanced,0.16365333398183188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,16,power_law_1.01,0.14703999757766723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,16,power_law_1.01,0.15665279626846312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,16,power_law_1.2,0.15404800176620484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,16,power_law_1.2,0.15489280223846436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,2,balanced,0.6236000061035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,2,balanced,0.6283733447392782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,2,power_law_1.01,0.5639808177947998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,2,power_law_1.01,0.5798719882965088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,2,power_law_1.2,0.5491199970245362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,2,power_law_1.2,0.5649151802062988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,256,balanced,0.10114133358001709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,256,balanced,0.101200004418691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,256,power_law_1.01,0.10033279657363892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,256,power_law_1.01,0.10033919811248779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,256,power_law_1.2,0.10068479776382447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,256,power_law_1.2,0.10205440521240235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,32,balanced,0.11732799808184306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,32,balanced,0.11956266562143962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,32,power_law_1.01,0.11450879573822022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,32,power_law_1.01,0.11463040113449097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,32,power_law_1.2,0.11508480310440064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,32,power_law_1.2,0.11527040004730224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,4,balanced,0.363103985786438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,4,balanced,0.36549333731333417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,4,power_law_1.01,0.3339839935302734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,4,power_law_1.01,0.33646719455718993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,4,power_law_1.2,0.337606406211853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,4,power_law_1.2,0.3395776033401489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,64,balanced,0.10902933279673259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,64,balanced,0.1092800001303355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,64,power_law_1.01,0.10621440410614014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,64,power_law_1.01,0.10692479610443115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,64,power_law_1.2,0.10696320533752442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,64,power_law_1.2,0.10703359842300415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,8,balanced,0.22593599557876587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,8,balanced,0.22613867123921713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,8,power_law_1.01,0.20887041091918945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,8,power_law_1.01,0.21410560607910156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,8,power_law_1.2,0.20949759483337402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,1,8,power_law_1.2,0.21407999992370605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,16,1,balanced,0.16657599806785583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,16,1,balanced,0.16859734058380127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,16,1,power_law_1.01,0.1410752058029175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,16,1,power_law_1.01,0.14191999435424804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,16,1,power_law_1.2,0.1507200002670288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,16,1,power_law_1.2,0.15459200143814086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,2,1,balanced,0.6076480150222778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,2,1,balanced,0.6083573500315348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,2,1,power_law_1.01,0.5221183776855469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,2,1,power_law_1.01,0.5281983852386475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,2,1,power_law_1.2,0.5240064144134522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,2,1,power_law_1.2,0.5293312072753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,32,1,balanced,0.12388267119725545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,32,1,balanced,0.12547733386357626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,32,1,power_law_1.01,0.11832959651947021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,32,1,power_law_1.01,0.11854720115661621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,32,1,power_law_1.2,0.11804159879684448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,32,1,power_law_1.2,0.11870720386505126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,4,1,balanced,0.3402293523152669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,4,1,balanced,0.3405760129292806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,4,1,power_law_1.01,0.2948352098464966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,4,1,power_law_1.01,0.299180793762207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,4,1,power_law_1.2,0.3020224094390869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,4,1,power_law_1.2,0.30432639122009275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,8,1,balanced,0.20829866329828897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,8,1,balanced,0.20892800887425741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,8,1,power_law_1.01,0.19279359579086303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,8,1,power_law_1.01,0.19479039907455445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,8,1,power_law_1.2,0.19496959447860718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,3072,1536,8,256,8,1,power_law_1.2,0.195251202583313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,1,balanced,0.5321600039800009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,1,balanced,0.5322133302688599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,1,power_law_1.01,0.6539519786834717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,1,power_law_1.01,0.6548031806945801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,1,power_law_1.2,0.6452735900878906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,1,power_law_1.2,0.6950784206390381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,2,balanced,0.3499679962793986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,2,balanced,0.3509440024693807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,2,power_law_1.01,0.43415679931640627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,2,power_law_1.01,0.4345280170440674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,2,power_law_1.2,0.4253119945526123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,2,power_law_1.2,0.4546175956726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,4,balanced,0.2661973237991333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,4,balanced,0.2705013354619344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,4,power_law_1.01,0.32196478843688964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,4,power_law_1.01,0.3369856119155884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,4,power_law_1.2,0.32264959812164307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,4,power_law_1.2,0.3285056114196777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,8,balanced,0.23034133513768515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,8,balanced,0.230730672677358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,8,power_law_1.01,0.26737279891967775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,8,power_law_1.01,0.2698879957199097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,8,power_law_1.2,0.26589438915252683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,1,8,power_law_1.2,0.2659392118453979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,16,1,balanced,0.08082666496435802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,16,1,balanced,0.08262399832407634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,16,1,power_law_1.01,0.0819711983203888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,16,1,power_law_1.01,0.08506240248680115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,16,1,power_law_1.2,0.08158079981803894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,16,1,power_law_1.2,0.08261759877204895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,2,1,balanced,0.29469867547353107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,2,1,balanced,0.29595200220743817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,2,1,power_law_1.01,0.3266688108444214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,2,1,power_law_1.01,0.33056640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,2,1,power_law_1.2,0.32842240333557127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,2,1,power_law_1.2,0.33660159111022947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,32,1,balanced,0.06428266565004985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,32,1,balanced,0.06449066599210103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,32,1,power_law_1.01,0.07083520293235779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,32,1,power_law_1.01,0.07117440104484558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,32,1,power_law_1.2,0.0692799985408783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,32,1,power_law_1.2,0.07063040137290955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,4,1,balanced,0.17883733908335367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,4,1,balanced,0.1805760065714518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,4,1,power_law_1.01,0.17323520183563232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,4,1,power_law_1.01,0.18168959617614747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,4,1,power_law_1.2,0.1739840030670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,4,1,power_law_1.2,0.17993600368499757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,8,1,balanced,0.10322133700052898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,8,1,balanced,0.1053493320941925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,8,1,power_law_1.01,0.10135680437088013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,8,1,power_law_1.01,0.10602879524230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,8,1,power_law_1.2,0.10391039848327636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,14336,2,8,8,1,power_law_1.2,0.10539519786834717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,1,balanced,0.7889546553293864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,1,balanced,0.7909706433614095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,1,power_law_1.01,0.7669504165649415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,1,power_law_1.01,0.7782015800476074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,1,power_law_1.2,0.7925312042236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,1,power_law_1.2,0.7993792057037353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,128,balanced,0.08347733815511067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,128,balanced,0.08538132905960083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,128,power_law_1.01,0.08478720188140869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,128,power_law_1.01,0.08613119721412658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,128,power_law_1.2,0.08475520014762879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,128,power_law_1.2,0.08693119883537292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,16,balanced,0.11754133303960164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,16,balanced,0.11760000387827556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,16,power_law_1.01,0.11585279703140258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,16,power_law_1.01,0.11791360378265381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,16,power_law_1.2,0.11624319553375244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,16,power_law_1.2,0.11805440187454223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,2,balanced,0.4390079975128174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,2,balanced,0.44044268131256104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,2,power_law_1.01,0.42899198532104493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,2,power_law_1.01,0.43201918601989747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,2,power_law_1.2,0.43517441749572755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,2,power_law_1.2,0.43576321601867674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,32,balanced,0.10293866197268169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,32,balanced,0.10338133573532104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,32,power_law_1.01,0.10386559963226319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,32,power_law_1.01,0.10496640205383301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,32,power_law_1.2,0.10370559692382812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,32,power_law_1.2,0.10402560234069824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,4,balanced,0.25459200143814087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,4,balanced,0.25484800338745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,4,power_law_1.01,0.25033600330352784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,4,power_law_1.01,0.2519551992416382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,4,power_law_1.2,0.24573440551757814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,4,power_law_1.2,0.24758400917053222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,64,balanced,0.09699733058611552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,64,balanced,0.09912000099817912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,64,power_law_1.01,0.09628159999847412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,64,power_law_1.01,0.09653120040893555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,64,power_law_1.2,0.09630079865455628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,64,power_law_1.2,0.09713280200958252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,8,balanced,0.16404799620310465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,8,balanced,0.1665173371632894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,8,power_law_1.01,0.16457600593566896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,8,power_law_1.01,0.16462719440460205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,8,power_law_1.2,0.17419519424438476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,1,8,power_law_1.2,0.17838079929351808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,16,1,balanced,0.12379200259844463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,16,1,balanced,0.12410666545232137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,16,1,power_law_1.01,0.12197760343551636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,16,1,power_law_1.01,0.12199679613113404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,16,1,power_law_1.2,0.1229632019996643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,16,1,power_law_1.2,0.12311680316925049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,2,1,balanced,0.3994186719258626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,2,1,balanced,0.4038613239924113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,2,1,power_law_1.01,0.4332608222961426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,2,1,power_law_1.01,0.4425792217254639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,2,1,power_law_1.2,0.44515838623046877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,2,1,power_law_1.2,0.44756479263305665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,32,1,balanced,0.10868799686431885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,32,1,balanced,0.10910399754842122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,32,1,power_law_1.01,0.10737279653549195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,32,1,power_law_1.01,0.1076159954071045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,32,1,power_law_1.2,0.10857599973678589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,32,1,power_law_1.2,0.1096384048461914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,4,1,balanced,0.24043200413386026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,4,1,balanced,0.2411253253618876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,4,1,power_law_1.01,0.23597440719604493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,4,1,power_law_1.01,0.23614718914031982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,4,1,power_law_1.2,0.23751039505004884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,4,1,power_law_1.2,0.23844480514526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,8,1,balanced,0.1564586659272512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,8,1,balanced,0.15654399991035461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,8,1,power_law_1.01,0.15164799690246583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,8,1,power_law_1.01,0.1534335970878601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,8,1,power_law_1.2,0.1515712022781372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,1536,8,128,8,1,power_law_1.2,0.15363199710845948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,1,balanced,5.298901240030925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,1,balanced,5.51478385925293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,1,power_law_1.01,4.920633697509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,1,power_law_1.01,4.945676803588867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,1,power_law_1.2,4.96300163269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,1,power_law_1.2,5.19854736328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,128,balanced,0.31385066111882526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,128,balanced,0.3139253258705139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,128,power_law_1.01,0.3115520000457764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,128,power_law_1.01,0.31157119274139405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,128,power_law_1.2,0.31948161125183105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,128,power_law_1.2,0.3207231998443604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,16,balanced,0.6157600084940592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,16,balanced,0.6165813207626343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,16,power_law_1.01,0.5749248027801513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,16,power_law_1.01,0.5877567768096924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,16,power_law_1.2,0.6032320022583008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,16,power_law_1.2,0.6040448188781739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,2,balanced,2.854640007019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,2,balanced,2.868373235066732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,2,power_law_1.01,2.5589311599731444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,2,power_law_1.01,2.605446434020996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,2,power_law_1.2,2.7082496643066407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,2,power_law_1.2,2.7154752731323244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,256,balanced,0.30179200569788617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,256,balanced,0.3035306731859843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,256,power_law_1.01,0.300927996635437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,256,power_law_1.01,0.3019968032836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,256,power_law_1.2,0.3062272071838379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,256,power_law_1.2,0.3062335968017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,32,balanced,0.4487413167953491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,32,balanced,0.4487573305765788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,32,power_law_1.01,0.4374783992767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,32,power_law_1.01,0.44119038581848147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,32,power_law_1.2,0.4398208141326904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,32,power_law_1.2,0.4457856178283691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,4,balanced,1.5373867352803547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,4,balanced,1.5379892985026042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,4,power_law_1.01,1.406931209564209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,4,power_law_1.01,1.4342528343200684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,4,power_law_1.2,1.454867172241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,4,power_law_1.2,1.472531223297119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,64,balanced,0.34700266520182294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,64,balanced,0.3476853370666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,64,power_law_1.01,0.3319744110107422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,64,power_law_1.01,0.3454655885696411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,64,power_law_1.2,0.3661887884140015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,64,power_law_1.2,0.36830079555511475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,8,balanced,0.9204426606496176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,8,balanced,0.9204586346944174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,8,power_law_1.01,0.8606847763061524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,8,power_law_1.01,0.8898431777954101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,8,power_law_1.2,0.8838015556335449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,1,8,power_law_1.2,0.8899711608886719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,16,1,balanced,1.4666506449381511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,16,1,balanced,1.4693013827006023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,16,1,power_law_1.01,1.3598976135253906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,16,1,power_law_1.01,1.367027187347412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,16,1,power_law_1.2,1.420032024383545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,16,1,power_law_1.2,1.4340543746948242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,2,1,balanced,2.5203466415405273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,2,1,balanced,2.5411200523376465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,2,1,power_law_1.01,2.4136703491210936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,2,1,power_law_1.01,2.4293695449829102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,2,1,power_law_1.2,2.4674495697021483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,2,1,power_law_1.2,2.5065216064453124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,32,1,balanced,1.159717321395874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,32,1,balanced,1.1617813110351562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,32,1,power_law_1.01,1.0753791809082032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,32,1,power_law_1.01,1.0795519828796387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,32,1,power_law_1.2,1.1260607719421387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,32,1,power_law_1.2,1.1339200019836426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,4,1,balanced,1.440069357554118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,4,1,balanced,1.4464747111002605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,4,1,power_law_1.01,1.3946368217468261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,4,1,power_law_1.01,1.3995712280273438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,4,1,power_law_1.2,1.4499263763427734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,4,1,power_law_1.2,1.4586751937866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,8,1,balanced,0.7940693696339926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,8,1,balanced,0.7995786666870117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,8,1,power_law_1.01,0.7449344158172607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,8,1,power_law_1.01,0.7508224010467529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,8,1,power_law_1.2,0.7651072025299073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,4096,2688,22,512,8,1,power_law_1.2,0.7661888122558593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,1,balanced,0.8272906939188639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,1,balanced,0.8301440080006918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,1,power_law_1.01,1.1224703788757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,1,power_law_1.01,1.1409215927124023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,1,power_law_1.2,1.1223936080932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,1,power_law_1.2,1.1669183731079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,2,balanced,0.49936532974243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,2,balanced,0.5018933216730753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,2,power_law_1.01,0.6142399787902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,2,power_law_1.01,0.6825535774230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,2,power_law_1.2,0.6616511821746827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,2,power_law_1.2,0.6616960048675538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,4,balanced,0.3495733340581258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,4,balanced,0.3524106740951538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,4,power_law_1.01,0.4403711795806885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,4,power_law_1.01,0.4459712028503418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,4,power_law_1.2,0.44121599197387695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,4,power_law_1.2,0.45922560691833497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,8,balanced,0.2814720074335734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,8,balanced,0.28149332602818805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,8,power_law_1.01,0.34050559997558594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,8,power_law_1.01,0.3423935890197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,8,power_law_1.2,0.33306241035461426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,1,8,power_law_1.2,0.35820798873901366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,16,1,balanced,0.10738666852315266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,16,1,balanced,0.10749866565068562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,16,1,power_law_1.01,0.11519999504089355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,16,1,power_law_1.01,0.11536639928817749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,16,1,power_law_1.2,0.11489280462265014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,16,1,power_law_1.2,0.115174400806427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,2,1,balanced,0.4485653241475423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,2,1,balanced,0.4489653507868449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,2,1,power_law_1.01,0.5485888004302979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,2,1,power_law_1.01,0.5518271923065186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,2,1,power_law_1.2,0.5482304096221924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,2,1,power_law_1.2,0.5655104160308838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,32,1,balanced,0.09238933523495992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,32,1,balanced,0.09343467156092326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,32,1,power_law_1.01,0.09745919704437256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,32,1,power_law_1.01,0.09791359901428223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,32,1,power_law_1.2,0.09618560075759888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,32,1,power_law_1.2,0.0974016010761261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,4,1,balanced,0.2627146641413371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,4,1,balanced,0.2629706660906474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,4,1,power_law_1.01,0.28782079219818113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,4,1,power_law_1.01,0.2997119903564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,4,1,power_law_1.2,0.2808192014694214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,4,1,power_law_1.2,0.2955199956893921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,8,1,balanced,0.14202133814493814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,8,1,balanced,0.14495467146237692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,8,1,power_law_1.01,0.1624127984046936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,8,1,power_law_1.01,0.1643839955329895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,8,1,power_law_1.2,0.15523200035095214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,16384,2,8,8,1,power_law_1.2,0.16418559551239015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,1,balanced,3.0960747400919595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,1,balanced,3.139967918395996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,1,power_law_1.01,2.6285375595092773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,1,power_law_1.01,2.6516096115112306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,1,power_law_1.2,2.666771125793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,1,power_law_1.2,2.683263969421387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,128,balanced,0.16856000820795694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,128,balanced,0.17006399234135947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,128,power_law_1.01,0.16603519916534423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,128,power_law_1.01,0.16709760427474976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,128,power_law_1.2,0.1663040041923523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,128,power_law_1.2,0.16716159582138063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,16,balanced,0.3301973342895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,16,balanced,0.3309280077616374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,16,power_law_1.01,0.30977280139923097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,16,power_law_1.01,0.3162048101425171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,16,power_law_1.2,0.32014079093933107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,16,power_law_1.2,0.3224384069442749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,2,balanced,1.5950506528218586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,2,balanced,1.6213812828063965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,2,power_law_1.01,1.3921152114868165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,2,power_law_1.01,1.4057024002075196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,2,power_law_1.2,1.3828543663024901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,2,power_law_1.2,1.3893759727478028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,256,balanced,0.16690667470296225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,256,balanced,0.16819200913111368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,256,power_law_1.01,0.1633407950401306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,256,power_law_1.01,0.16368639469146729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,256,power_law_1.2,0.16323200464248658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,256,power_law_1.2,0.16382720470428466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,32,balanced,0.21566933393478394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,32,balanced,0.21766400337219238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,32,power_law_1.01,0.2017983913421631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,32,power_law_1.01,0.20412800312042237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,32,power_law_1.2,0.20396800041198732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,32,power_law_1.2,0.203987193107605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,4,balanced,0.8473493258158366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,4,balanced,0.8476906617482504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,4,power_law_1.01,0.7698495864868165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,4,power_law_1.01,0.7788415908813476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,4,power_law_1.2,0.7649663925170899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,4,power_law_1.2,0.7726655960083008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,64,balanced,0.1772800087928772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,64,balanced,0.17729600270589194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,64,power_law_1.01,0.17534719705581664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,64,power_law_1.01,0.1759552001953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,64,power_law_1.2,0.17374720573425292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,64,power_law_1.2,0.17466880083084108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,8,balanced,0.5016053517659506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,8,balanced,0.5050026575724283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,8,power_law_1.01,0.48270721435546876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,8,power_law_1.01,0.48750081062316897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,8,power_law_1.2,0.4729343891143799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,1,8,power_law_1.2,0.48385281562805177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,16,1,balanced,0.3291520078976949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,16,1,balanced,0.33026132980982464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,16,1,power_law_1.01,0.2699712038040161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,16,1,power_law_1.01,0.27491838932037355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,16,1,power_law_1.2,0.27761919498443605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,16,1,power_law_1.2,0.2863231897354126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,2,1,balanced,1.552245299021403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,2,1,balanced,1.5751892725626628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,2,1,power_law_1.01,1.3465536117553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,2,1,power_law_1.01,1.3682815551757812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,2,1,power_law_1.2,1.348851203918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,2,1,power_law_1.2,1.3508607864379882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,32,1,balanced,0.22924266258875528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,32,1,balanced,0.23009600241978964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,32,1,power_law_1.01,0.21507198810577394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,32,1,power_law_1.01,0.21647999286651612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,32,1,power_law_1.2,0.21571838855743408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,32,1,power_law_1.2,0.21668479442596436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,4,1,balanced,0.8068373203277588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,4,1,balanced,0.8078666528066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,4,1,power_law_1.01,0.7117311954498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,4,1,power_law_1.01,0.7157887935638427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,4,1,power_law_1.2,0.7217535972595215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,4,1,power_law_1.2,0.7425343990325928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,8,1,balanced,0.48096001148223877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,8,1,balanced,0.4814560015996297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,8,1,power_law_1.01,0.4229440212249756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,8,1,power_law_1.01,0.44393601417541506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,8,1,power_law_1.2,0.4343616008758545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2048,8,256,8,1,power_law_1.2,0.44260478019714355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,1,balanced,2.4219412803649902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,1,balanced,2.459503968556722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,1,power_law_1.01,2.248703956604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,1,power_law_1.01,2.2708480834960936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,1,power_law_1.2,2.2945344924926756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,1,power_law_1.2,2.3746816635131838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,16,balanced,0.26267733176549274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,16,balanced,0.2637653350830078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,16,power_law_1.01,0.25696640014648436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,16,power_law_1.01,0.26622719764709474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,16,power_law_1.2,0.2534463882446289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,16,power_law_1.2,0.2701184034347534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,2,balanced,1.2595360279083252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,2,balanced,1.2646880149841309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,2,power_law_1.01,1.1845888137817382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,2,power_law_1.01,1.1979840278625489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,2,power_law_1.2,1.2086848258972167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,2,power_law_1.2,1.2279999732971192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,32,balanced,0.17109866937001547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,32,balanced,0.17138665914535522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,32,power_law_1.01,0.1660863995552063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,32,power_law_1.01,0.1695296049118042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,32,power_law_1.2,0.17496320009231567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,32,power_law_1.2,0.17711360454559327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,4,balanced,0.672048012415568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,4,balanced,0.6727519830067953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,4,power_law_1.01,0.6433087825775147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,4,power_law_1.01,0.652396821975708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,4,power_law_1.2,0.6645823955535889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,4,power_law_1.2,0.6647615909576416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,8,balanced,0.3926933209101359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,8,balanced,0.39363733927408856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,8,power_law_1.01,0.3816447973251343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,8,power_law_1.01,0.3820672035217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,8,power_law_1.2,0.39283840656280516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,1,8,power_law_1.2,0.4007999897003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,16,1,balanced,0.27211199204126996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,16,1,balanced,0.2733760078748067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,16,1,power_law_1.01,0.2565311908721924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,16,1,power_law_1.01,0.25759999752044677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,16,1,power_law_1.2,0.26610560417175294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,16,1,power_law_1.2,0.26878719329833983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,2,1,balanced,1.230079968770345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,2,1,balanced,1.2416106859842937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,2,1,power_law_1.01,1.1317248344421387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,2,1,power_law_1.01,1.1436991691589355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,2,1,power_law_1.2,1.1577664375305177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,2,1,power_law_1.2,1.1813952445983886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,32,1,balanced,0.18963199853897095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,32,1,balanced,0.1914773384730021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,32,1,power_law_1.01,0.1859071969985962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,32,1,power_law_1.01,0.1859455943107605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,32,1,power_law_1.2,0.1878335952758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,32,1,power_law_1.2,0.18854399919509887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,4,1,balanced,0.6436213254928589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,4,1,balanced,0.644320011138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,4,1,power_law_1.01,0.6187007904052735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,4,1,power_law_1.01,0.6215551853179931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,4,1,power_law_1.2,0.611411190032959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,4,1,power_law_1.2,0.6200064182281494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,8,1,balanced,0.36260799566904706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,8,1,balanced,0.3638453483581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,8,1,power_law_1.01,0.349126410484314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,8,1,power_law_1.01,0.34920320510864256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,8,1,power_law_1.2,0.35676159858703616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,6144,2560,8,160,8,1,power_law_1.2,0.3570751905441284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,1,balanced,3.652864138285319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,1,balanced,3.690688133239746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,1,power_law_1.01,3.07128963470459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,1,power_law_1.01,3.1379840850830076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,1,power_law_1.2,3.0787071228027343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,1,power_law_1.2,3.2242752075195313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,128,balanced,0.19101333618164062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,128,balanced,0.19174933433532715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,128,power_law_1.01,0.18917759656906127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,128,power_law_1.01,0.18954880237579347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,128,power_law_1.2,0.188428795337677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,128,power_law_1.2,0.18982399702072145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,16,balanced,0.3896373510360718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,16,balanced,0.39047467708587646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,16,power_law_1.01,0.35921919345855713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,16,power_law_1.01,0.36494719982147217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,16,power_law_1.2,0.36138880252838135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,16,power_law_1.2,0.36491520404815675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,2,balanced,1.8975359598795574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,2,balanced,1.9109279314676921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,2,power_law_1.01,1.6124223709106444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,2,power_law_1.01,1.6413824081420898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,2,power_law_1.2,1.590003204345703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,2,power_law_1.2,1.6579072952270508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,256,balanced,0.18895999590555826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,256,balanced,0.18982400496800741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,256,power_law_1.01,0.1857151985168457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,256,power_law_1.01,0.18689919710159303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,256,power_law_1.2,0.1873792052268982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,256,power_law_1.2,0.18761600255966188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,32,balanced,0.25507734219233197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,32,balanced,0.2569599946339925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,32,power_law_1.01,0.2474368095397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,32,power_law_1.01,0.25080320835113523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,32,power_law_1.2,0.23766400814056396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,32,power_law_1.2,0.2518719911575317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,4,balanced,0.9894933700561523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,4,balanced,0.9915040334065756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,4,power_law_1.01,0.8911040306091309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,4,power_law_1.01,0.8914431571960449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,4,power_law_1.2,0.8950783729553222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,4,power_law_1.2,0.9185024261474609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,64,balanced,0.2014453411102295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,64,balanced,0.203274667263031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,64,power_law_1.01,0.1984063982963562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,64,power_law_1.01,0.1985152006149292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,64,power_law_1.2,0.20016000270843506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,64,power_law_1.2,0.20069119930267335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,8,balanced,0.5886666774749756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,8,balanced,0.593610684076945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,8,power_law_1.01,0.505951976776123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,8,power_law_1.01,0.5605184078216553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,8,power_law_1.2,0.5639999866485595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,1,8,power_law_1.2,0.5802624225616455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,16,1,balanced,0.3815893332163493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,16,1,balanced,0.3818399906158447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,16,1,power_law_1.01,0.3173504114151001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,16,1,power_law_1.01,0.320249605178833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,16,1,power_law_1.2,0.32975358963012696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,16,1,power_law_1.2,0.3422080039978027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,2,1,balanced,1.816490650177002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,2,1,balanced,1.932634671529134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,2,1,power_law_1.01,1.5769023895263672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,2,1,power_law_1.01,1.609734344482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,2,1,power_law_1.2,1.593785572052002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,2,1,power_law_1.2,1.5947711944580079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,32,1,balanced,0.2627093394597371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,32,1,balanced,0.2638026674588521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,32,1,power_law_1.01,0.24677119255065919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,32,1,power_law_1.01,0.2474368095397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,32,1,power_law_1.2,0.246995210647583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,32,1,power_law_1.2,0.251200008392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,4,1,balanced,0.9422453244527181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,4,1,balanced,0.9438933531443278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,4,1,power_law_1.01,0.8392959594726562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,4,1,power_law_1.01,0.8605504035949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,4,1,power_law_1.2,0.846617603302002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,4,1,power_law_1.2,0.8501824378967285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,8,1,balanced,0.5579413175582886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,8,1,balanced,0.5616746743520101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,8,1,power_law_1.01,0.4864640235900879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,8,1,power_law_1.01,0.49719038009643557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,8,1,power_law_1.2,0.49431681632995605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,256,8,1,power_law_1.2,0.5061439990997314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,1,balanced,5.534655888875325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,1,balanced,5.564800262451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,1,power_law_1.01,4.211103820800782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,1,power_law_1.01,4.249792098999023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,1,power_law_1.2,4.308691024780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,1,power_law_1.2,4.334265518188476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,128,balanced,0.24257065852483115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,128,balanced,0.244053324063619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,128,power_law_1.01,0.23890559673309325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,128,power_law_1.01,0.24000000953674316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,128,power_law_1.2,0.23741440773010253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,128,power_law_1.2,0.23927679061889648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,16,balanced,0.5212800105412801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,16,balanced,0.524346669514974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,16,power_law_1.01,0.46803841590881345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,16,power_law_1.01,0.47484798431396485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,16,power_law_1.2,0.4611839771270752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,16,power_law_1.2,0.46126718521118165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,2,balanced,2.73911984761556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,2,balanced,2.7991838455200195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,2,power_law_1.01,2.2366912841796873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,2,power_law_1.01,2.2971775054931642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,2,power_law_1.2,2.227667236328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,2,power_law_1.2,2.2477760314941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,32,balanced,0.36421334743499756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,32,balanced,0.3654133478800456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,32,power_law_1.01,0.3206016063690186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,32,power_law_1.01,0.33832321166992185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,32,power_law_1.2,0.31988480091094973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,32,power_law_1.2,0.35482239723205566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,4,balanced,1.4574027061462402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,4,balanced,1.4656426111857097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,4,power_law_1.01,1.2463680267333985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,4,power_law_1.01,1.272435188293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,4,power_law_1.2,1.1760704040527343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,4,power_law_1.2,1.1976256370544434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,64,balanced,0.2662453254063924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,64,balanced,0.26895467440287274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,64,power_law_1.01,0.25553278923034667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,64,power_law_1.01,0.262604808807373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,64,power_law_1.2,0.2577984094619751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,64,power_law_1.2,0.2607487916946411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,8,balanced,0.8337600231170654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,8,balanced,0.8391679922739664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,8,power_law_1.01,0.7034560203552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,8,power_law_1.01,0.7807231903076172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,8,power_law_1.2,0.7037759780883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,1,8,power_law_1.2,0.7159488201141357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,16,1,balanced,0.4954773187637329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,16,1,balanced,0.4997386535008748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,16,1,power_law_1.01,0.43978238105773926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,16,1,power_law_1.01,0.4424448013305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,16,1,power_law_1.2,0.43772158622741697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,16,1,power_law_1.2,0.43854718208312987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,2,1,balanced,2.788640022277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,2,1,balanced,2.7916320164998374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,2,1,power_law_1.01,2.180851173400879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,2,1,power_law_1.01,2.182822418212891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,2,1,power_law_1.2,2.148518371582031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,2,1,power_law_1.2,2.1900672912597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,32,1,balanced,0.3580640157063802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,32,1,balanced,0.36026668548583984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,32,1,power_law_1.01,0.32115199565887453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,32,1,power_law_1.01,0.3212032079696655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,32,1,power_law_1.2,0.3169471979141235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,32,1,power_law_1.2,0.31775999069213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,4,1,balanced,1.3718345959981282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,4,1,balanced,1.407466729482015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,4,1,power_law_1.01,1.1270784378051757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,4,1,power_law_1.01,1.1484416007995606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,4,1,power_law_1.2,1.0991168022155762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,4,1,power_law_1.2,1.125068759918213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,8,1,balanced,0.7892213662465414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,8,1,balanced,0.7935413519541422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,8,1,power_law_1.01,0.6549183845520019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,8,1,power_law_1.01,0.6559552192687989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,8,1,power_law_1.2,0.6529280185699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,256,7168,2048,8,384,8,1,power_law_1.2,0.6575744152069092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,1,balanced,0.4561440149943034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,1,balanced,0.45901334285736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,1,power_law_1.01,0.5582079887390137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,1,power_law_1.01,0.5583680152893067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,1,power_law_1.2,0.5676799774169922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,1,power_law_1.2,0.5788479804992676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,128,balanced,0.17965867122014365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,128,balanced,0.18050666650136313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,128,power_law_1.01,0.1907968044281006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,128,power_law_1.01,0.19352960586547852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,128,power_law_1.2,0.20322558879852295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,128,power_law_1.2,0.2032639980316162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,16,balanced,0.2014453411102295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,16,balanced,0.20155733823776245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,16,power_law_1.01,0.21633920669555665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,16,power_law_1.01,0.2196863889694214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,16,power_law_1.2,0.22736639976501466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,16,power_law_1.2,0.22875521183013917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,2,balanced,0.36905066172281903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,2,balanced,0.37118399143218994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,2,power_law_1.01,0.3905728101730347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,2,power_law_1.01,0.39356160163879395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,2,power_law_1.2,0.3993535995483398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,2,power_law_1.2,0.4194687843322754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,32,balanced,0.18929066260655722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,32,balanced,0.18940800428390503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,32,power_law_1.01,0.20726399421691893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,32,power_law_1.01,0.2079616069793701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,32,power_law_1.2,0.21361920833587647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,32,power_law_1.2,0.21388800144195558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,4,balanced,0.27384533484776813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,4,balanced,0.2748853365580241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,4,power_law_1.01,0.2987776041030884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,4,power_law_1.01,0.2998464107513428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,4,power_law_1.2,0.30846080780029295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,4,power_law_1.2,0.3198080062866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,64,balanced,0.18306666612625122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,64,balanced,0.18316799402236938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,64,power_law_1.01,0.19740159511566163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,64,power_law_1.01,0.19774719476699829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,64,power_law_1.2,0.20657920837402344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,64,power_law_1.2,0.210265588760376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,8,balanced,0.2267306645711263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,8,balanced,0.2274506688117981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,8,power_law_1.01,0.24683520793914795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,8,power_law_1.01,0.2523200035095215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,8,power_law_1.2,0.25642240047454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,1,8,power_law_1.2,0.2564800024032593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,2,1,balanced,0.3338559865951538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,2,1,balanced,0.3359626531600952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,2,1,power_law_1.01,0.345414400100708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,2,1,power_law_1.01,0.34851200580596925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,2,1,power_law_1.2,0.3512511968612671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,2,1,power_law_1.2,0.35224959850311277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,4,1,balanced,0.23870933055877686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,4,1,balanced,0.24001065889994302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,4,1,power_law_1.01,0.24970879554748535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,4,1,power_law_1.01,0.25039360523223875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,4,1,power_law_1.2,0.252128005027771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2048,768,8,128,4,1,power_law_1.2,0.25258240699768064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,1,balanced,1.1723679701487224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,1,balanced,1.1889920234680176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,1,power_law_1.01,1.1376192092895507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,1,power_law_1.01,1.150937557220459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,1,power_law_1.2,1.1876928329467773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,1,power_law_1.2,1.1918144226074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,128,balanced,0.23839465777079263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,128,balanced,0.24115200837453207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,128,power_law_1.01,0.2614847898483276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,128,power_law_1.01,0.2679680109024048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,128,power_law_1.2,0.27991681098937987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,128,power_law_1.2,0.2919935941696167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,16,balanced,0.3025386730829875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,16,balanced,0.3026026686032613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,16,power_law_1.01,0.33930881023406984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,16,power_law_1.01,0.34189438819885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,16,power_law_1.2,0.3453439950942993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,16,power_law_1.2,0.3671168088912964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,2,balanced,0.7772640387217203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,2,balanced,0.7804000377655029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,2,power_law_1.01,0.7575168132781982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,2,power_law_1.01,0.7828800201416015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,2,power_law_1.2,0.7952576160430909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,2,power_law_1.2,0.8061823844909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,32,balanced,0.2648106614748637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,32,balanced,0.26528533299763996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,32,power_law_1.01,0.29402880668640136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,32,power_law_1.01,0.29678080081939695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,32,power_law_1.2,0.3101183891296387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,32,power_law_1.2,0.31371519565582273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,4,balanced,0.5107839902242025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,4,balanced,0.512223998705546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,4,power_law_1.01,0.5257664203643799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,4,power_law_1.01,0.5348608016967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,4,power_law_1.2,0.5415103912353516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,4,power_law_1.2,0.5486976146697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,64,balanced,0.24715199073155722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,64,balanced,0.24861333767573038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,64,power_law_1.01,0.2718463897705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,64,power_law_1.01,0.27777919769287107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,64,power_law_1.2,0.2961280107498169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,64,power_law_1.2,0.2999808073043823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,8,balanced,0.37373868624369305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,8,balanced,0.37546666463216144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,8,power_law_1.01,0.3878528118133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,8,power_law_1.01,0.3878976106643677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,8,power_law_1.2,0.41718401908874514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,1,8,power_law_1.2,0.42942080497741697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,16,1,balanced,0.5420373280843099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,16,1,balanced,0.5429013172785441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,16,1,power_law_1.01,0.5154560089111329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,16,1,power_law_1.01,0.5158847808837891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,16,1,power_law_1.2,0.5252799987792969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,16,1,power_law_1.2,0.5285120010375977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,2,1,balanced,0.7438879807790121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,2,1,balanced,0.7450293699900309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,2,1,power_law_1.01,0.7068927764892579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,2,1,power_law_1.01,0.7105408191680909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,2,1,power_law_1.2,0.7291647911071777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,2,1,power_law_1.2,0.7310272216796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,32,1,balanced,0.43718401590983075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,32,1,balanced,0.43808531761169434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,32,1,power_law_1.01,0.4145343780517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,32,1,power_law_1.01,0.41821441650390623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,32,1,power_law_1.2,0.42529921531677245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,32,1,power_law_1.2,0.4270016193389893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,4,1,balanced,0.4676053524017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,4,1,balanced,0.468666672706604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,4,1,power_law_1.01,0.45063037872314454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,4,1,power_law_1.01,0.45101442337036135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,4,1,power_law_1.2,0.4606143951416016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,4,1,power_law_1.2,0.46248321533203124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,8,1,balanced,0.6905279954274496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,8,1,balanced,0.6907680034637451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,8,1,power_law_1.01,0.6559167861938476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,8,1,power_law_1.01,0.6570816040039062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,8,1,power_law_1.2,0.6706816196441651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,2688,1856,6,128,8,1,power_law_1.2,0.6718976020812988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,1,balanced,1.6012639999389648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,1,balanced,1.6445919672648113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,1,power_law_1.01,1.8517951965332031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,1,power_law_1.01,1.8994560241699219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,1,power_law_1.2,1.954591941833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,1,power_law_1.2,1.9836544036865233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,128,balanced,0.29768532514572144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,128,balanced,0.29897600412368774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,128,power_law_1.01,0.32119040489196776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,128,power_law_1.01,0.3246335983276367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,128,power_law_1.2,0.3428544044494629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,128,power_law_1.2,0.34303998947143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,16,balanced,0.37195734182993573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,16,balanced,0.3723413149515788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,16,power_law_1.01,0.4232895851135254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,16,power_law_1.01,0.423635196685791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,16,power_law_1.2,0.43632001876831056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,16,power_law_1.2,0.43787522315979005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,2,balanced,0.9530613422393799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,2,balanced,0.9584320386250814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,2,power_law_1.01,1.1179648399353028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,2,power_law_1.01,1.1326144218444825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,2,power_law_1.2,1.1608320236206056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,2,power_law_1.2,1.1664511680603027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,256,balanced,0.29569600025812787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,256,balanced,0.29572800795237225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,256,power_law_1.01,0.31178879737854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,256,power_law_1.01,0.3125375986099243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,256,power_law_1.2,0.3254784107208252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,256,power_law_1.2,0.32602880001068113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,32,balanced,0.3258133331934611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,32,balanced,0.3264213403065999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,32,power_law_1.01,0.36447360515594485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,32,power_law_1.01,0.36481919288635256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,32,power_law_1.2,0.3951936006546021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,32,power_law_1.2,0.39799039363861083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,4,balanced,0.6276053190231323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,4,balanced,0.6276266574859619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,4,power_law_1.01,0.7324096202850342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,4,power_law_1.01,0.7447936058044433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,4,power_law_1.2,0.7544703960418702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,4,power_law_1.2,0.7654528141021728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,64,balanced,0.3051786621411641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,64,balanced,0.30593599875768024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,64,power_law_1.01,0.3375999927520752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,64,power_law_1.01,0.34025599956512453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,64,power_law_1.2,0.3554879903793335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,64,power_law_1.2,0.35641601085662844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,8,balanced,0.4554986556371053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,8,balanced,0.4573226769765218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,8,power_law_1.01,0.5274112224578857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,8,power_law_1.01,0.5323584079742432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,8,power_law_1.2,0.5476416110992431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,1,8,power_law_1.2,0.5561728000640869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,16,1,balanced,0.3124213417371114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,16,1,balanced,0.31249066193898517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,16,1,power_law_1.01,0.36469759941101076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,16,1,power_law_1.01,0.3656447887420654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,16,1,power_law_1.2,0.37150719165802004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,16,1,power_law_1.2,0.3745408058166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,2,1,balanced,0.8954559961954752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,2,1,balanced,0.8954986731211344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,2,1,power_law_1.01,1.0450240135192872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,2,1,power_law_1.01,1.0614080429077148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,2,1,power_law_1.2,1.0889599800109864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,2,1,power_law_1.2,1.0911231994628907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,32,1,balanced,0.2609120011329651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,32,1,balanced,0.2627306580543518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,32,1,power_law_1.01,0.3095423936843872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,32,1,power_law_1.01,0.31052799224853517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,32,1,power_law_1.2,0.3145663976669312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,32,1,power_law_1.2,0.31648640632629393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,4,1,balanced,0.5505706469217936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,4,1,balanced,0.550927996635437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,4,1,power_law_1.01,0.6332672119140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,4,1,power_law_1.01,0.6387968063354492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,4,1,power_law_1.2,0.6589248180389404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,4,1,power_law_1.2,0.6677951812744141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,8,1,balanced,0.38072001934051514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,8,1,balanced,0.3818560043970744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,8,1,power_law_1.01,0.4338111877441406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,8,1,power_law_1.01,0.4366015911102295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,8,1,power_law_1.2,0.45532798767089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,3072,1536,8,256,8,1,power_law_1.2,0.4652544021606445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,1,balanced,2.545599937438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,1,balanced,2.594154675801595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,1,power_law_1.01,2.6783552169799805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,1,power_law_1.01,2.720294380187988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,1,power_law_1.2,2.6771520614624023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,1,power_law_1.2,2.68417911529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,2,balanced,1.4283413887023926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,2,balanced,1.4367893536885579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,2,power_law_1.01,1.9284608840942383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,2,power_law_1.01,1.9939840316772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,2,power_law_1.2,1.9645055770874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,2,power_law_1.2,1.9658432006835938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,4,balanced,0.9110879898071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,4,balanced,0.9111253420511881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,4,power_law_1.01,1.4516160011291503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,4,power_law_1.01,1.6100927352905274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,4,power_law_1.2,1.53504638671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,4,power_law_1.2,1.7092672348022462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,8,balanced,0.621674656867981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,8,balanced,0.6231146653493246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,8,power_law_1.01,1.257408046722412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,8,power_law_1.01,1.341702365875244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,8,power_law_1.2,1.3282431602478026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,1,8,power_law_1.2,1.3347071647644042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,16,1,balanced,0.238319993019104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,16,1,balanced,0.23863466580708823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,16,1,power_law_1.01,0.24208641052246094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,16,1,power_law_1.01,0.24442880153656005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,16,1,power_law_1.2,0.2447808027267456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,16,1,power_law_1.2,0.24554240703582764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,2,1,balanced,1.281872034072876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,2,1,balanced,1.2937013308207195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,2,1,power_law_1.01,1.3358464241027832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,2,1,power_law_1.01,1.3569024085998536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,2,1,power_law_1.2,1.3305600166320801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,2,1,power_law_1.2,1.3425024032592774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,32,1,balanced,0.1726026733716329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,32,1,balanced,0.17411200205485025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,32,1,power_law_1.01,0.1738368034362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,32,1,power_law_1.01,0.1770560026168823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,32,1,power_law_1.2,0.17570559978485106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,32,1,power_law_1.2,0.176147198677063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,4,1,balanced,0.6787892977396647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,4,1,balanced,0.6824106375376383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,4,1,power_law_1.01,0.7032127857208252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,4,1,power_law_1.01,0.7110079765319824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,4,1,power_law_1.2,0.7056896209716796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,4,1,power_law_1.2,0.7103807926177979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,8,1,balanced,0.37404799461364746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,8,1,balanced,0.37592534224192303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,8,1,power_law_1.01,0.38753280639648435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,8,1,power_law_1.01,0.3886591911315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,8,1,power_law_1.2,0.3864703893661499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,14336,2,8,8,1,power_law_1.2,0.3922431945800781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,1,balanced,1.6649279594421387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,1,balanced,1.6717012723286946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,1,power_law_1.01,1.7385343551635741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,1,power_law_1.01,1.7592256546020508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,1,power_law_1.2,1.7770368576049804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,1,power_law_1.2,1.8108991622924804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,128,balanced,0.3094240029652913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,128,balanced,0.3095093369483948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,128,power_law_1.01,0.3509567975997925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,128,power_law_1.01,0.353600001335144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,128,power_law_1.2,0.3830080032348633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,128,power_law_1.2,0.3969023942947388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,16,balanced,0.3831253449122111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,16,balanced,0.385535995165507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,16,power_law_1.01,0.45080318450927737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,16,power_law_1.01,0.46852478981018064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,16,power_law_1.2,0.48474879264831544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,16,power_law_1.2,0.5113215923309327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,2,balanced,0.9963413079579672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,2,balanced,1.0004053115844727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,2,power_law_1.01,1.0853823661804198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,2,power_law_1.01,1.1078783988952636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,2,power_law_1.2,1.120697593688965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,2,power_law_1.2,1.1325311660766602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,32,balanced,0.33887465794881183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,32,balanced,0.33984533945719403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,32,power_law_1.01,0.40176000595092776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,32,power_law_1.01,0.4052735805511475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,32,power_law_1.2,0.4311999797821045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,32,power_law_1.2,0.4385791778564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,4,balanced,0.6467359860738119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,4,balanced,0.6468533277511597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,4,power_law_1.01,0.7287487983703613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,4,power_law_1.01,0.729478406906128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,4,power_law_1.2,0.722815990447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,4,power_law_1.2,0.744761610031128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,64,balanced,0.31668267647425336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,64,balanced,0.31804800033569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,64,power_law_1.01,0.36092801094055177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,64,power_law_1.01,0.36764159202575686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,64,power_law_1.2,0.3998528003692627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,64,power_law_1.2,0.4002431869506836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,8,balanced,0.4726080099741618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,8,balanced,0.4732746680577596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,8,power_law_1.01,0.5682623863220215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,8,power_law_1.01,0.5693056106567382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,8,power_law_1.2,0.5625664234161377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,1,8,power_law_1.2,0.5708032131195069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,16,1,balanced,0.3546080191930135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,16,1,balanced,0.35470398267110187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,16,1,power_law_1.01,0.37098240852355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,16,1,power_law_1.01,0.3717119932174683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,16,1,power_law_1.2,0.3723328113555908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,16,1,power_law_1.2,0.3731071949005127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,2,1,balanced,0.8164213498433431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,2,1,balanced,0.820138692855835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,2,1,power_law_1.01,0.9891008377075196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,2,1,power_law_1.01,0.9907903671264648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,2,1,power_law_1.2,1.029971218109131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,2,1,power_law_1.2,1.0313023567199706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,32,1,balanced,0.2978079915046692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,32,1,balanced,0.2988319993019104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,32,1,power_law_1.01,0.3099391937255859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,32,1,power_law_1.01,0.3104640007019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,32,1,power_law_1.2,0.3113919973373413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,32,1,power_law_1.2,0.31252479553222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,4,1,balanced,0.5973493258158366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,4,1,balanced,0.5991359949111938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,4,1,power_law_1.01,0.6208320140838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,4,1,power_law_1.01,0.6208767890930176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,4,1,power_law_1.2,0.6306879997253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,4,1,power_law_1.2,0.6338751792907715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,8,1,balanced,0.42265601952870685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,8,1,balanced,0.42326398690541583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,8,1,power_law_1.01,0.43837437629699705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,8,1,power_law_1.01,0.4403200149536133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,8,1,power_law_1.2,0.44303359985351565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,1536,8,128,8,1,power_law_1.2,0.444217586517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,1,balanced,11.759877522786459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,1,balanced,12.39465077718099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,1,power_law_1.01,10.612671661376954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,1,power_law_1.01,10.940831756591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,1,power_law_1.2,11.070758056640624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,1,power_law_1.2,11.602623748779298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,128,balanced,1.1327306429545085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,128,balanced,1.1335840225219727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,128,power_law_1.01,1.2136256217956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,128,power_law_1.01,1.2150976181030273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,128,power_law_1.2,1.2446016311645507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,128,power_law_1.2,1.2583999633789062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,16,balanced,1.656943957010905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,16,balanced,1.6593012809753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,16,power_law_1.01,1.7387008666992188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,16,power_law_1.01,1.7528511047363282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,16,power_law_1.2,1.7912704467773437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,16,power_law_1.2,1.8412416458129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,2,balanced,6.357781092325847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,2,balanced,6.46562131245931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,2,power_law_1.01,5.919577789306641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,2,power_law_1.01,6.03831672668457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,2,power_law_1.2,6.089823913574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,2,power_law_1.2,6.233119964599609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,256,balanced,1.0905813376108806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,256,balanced,1.0929439862569172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,256,power_law_1.01,1.1500864028930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,256,power_law_1.01,1.1763520240783691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,256,power_law_1.2,1.2086848258972167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,256,power_law_1.2,1.2101247787475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,32,balanced,1.3521226247151692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,32,balanced,1.3543893496195476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,32,power_law_1.01,1.459059238433838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,32,power_law_1.01,1.4831616401672363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,32,power_law_1.2,1.482316780090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,32,power_law_1.2,1.5598655700683595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,4,balanced,3.520719846089681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,4,balanced,3.576767921447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,4,power_law_1.01,3.4810176849365235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,4,power_law_1.01,3.4957374572753905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,4,power_law_1.2,3.4953216552734374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,4,power_law_1.2,3.593868637084961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,64,balanced,1.2057440280914307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,64,balanced,1.2072693506876628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,64,power_law_1.01,1.2790335655212401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,64,power_law_1.01,1.2860095977783204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,64,power_law_1.2,1.3618559837341309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,64,power_law_1.2,1.3766976356506349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,8,balanced,2.264047940572103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,8,balanced,2.268496036529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,8,power_law_1.01,2.300345611572266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,8,power_law_1.01,2.3290624618530273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,8,power_law_1.2,2.4403839111328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,1,8,power_law_1.2,2.45034236907959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,16,1,balanced,3.220149358113607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,16,1,balanced,3.2251412073771157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,16,1,power_law_1.01,2.934867286682129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,16,1,power_law_1.01,2.938150405883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,16,1,power_law_1.2,2.9937280654907226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,16,1,power_law_1.2,3.0027584075927733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,2,1,balanced,5.3335520426432295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,2,1,balanced,5.404095967610677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,2,1,power_law_1.01,4.729459381103515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,2,1,power_law_1.01,4.851935958862304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,2,1,power_law_1.2,4.877510452270508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,2,1,power_law_1.2,4.969996643066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,32,1,balanced,2.8199199040730796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,32,1,balanced,2.821002642313639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,32,1,power_law_1.01,2.5538496017456054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,32,1,power_law_1.01,2.571187210083008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,32,1,power_law_1.2,2.626412773132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,32,1,power_law_1.2,2.6320959091186524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,4,1,balanced,6.903530756632487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,4,1,balanced,7.11024538675944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,4,1,power_law_1.01,6.871647644042969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,4,1,power_law_1.01,6.878752136230469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,4,1,power_law_1.2,6.674150085449218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,4,1,power_law_1.2,6.744057464599609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,8,1,balanced,2.063103993733724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,8,1,balanced,2.087402661641439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,8,1,power_law_1.01,1.8878080368041992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,8,1,power_law_1.01,1.8957183837890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,8,1,power_law_1.2,1.9184320449829102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,4096,2688,22,512,8,1,power_law_1.2,1.9321216583251952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,1,balanced,4.170991897583008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,1,balanced,4.4312747319539385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,1,power_law_1.01,4.422310256958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,1,power_law_1.01,4.595423889160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,1,power_law_1.2,4.274182510375977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,1,power_law_1.2,4.452710342407227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,2,balanced,2.2906880378723145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,2,balanced,2.3126880327860513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,2,power_law_1.01,2.9868288040161133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,2,power_law_1.01,3.1686527252197267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,2,power_law_1.2,2.9610240936279295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,2,power_law_1.2,3.129696083068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,4,balanced,1.2584693431854248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,4,balanced,1.2703253428141277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,4,power_law_1.01,2.3328704833984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,4,power_law_1.01,2.4681728363037108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,4,power_law_1.2,2.345401573181152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,4,power_law_1.2,2.3464639663696287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,8,balanced,0.8118826548258463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,8,balanced,0.8134453296661377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,8,power_law_1.01,1.9809600830078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,8,power_law_1.01,1.9846656799316407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,8,power_law_1.2,1.7871551513671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,1,8,power_law_1.2,2.010886383056641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,16,1,balanced,0.3442506790161133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,16,1,balanced,0.344490647315979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,16,1,power_law_1.01,0.3591936111450195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,16,1,power_law_1.01,0.3647808074951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,16,1,power_law_1.2,0.3580735921859741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,16,1,power_law_1.2,0.35935359001159667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,2,1,balanced,2.0635679562886557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,2,1,balanced,2.15939728418986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,2,1,power_law_1.01,2.162335968017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,2,1,power_law_1.01,2.1990528106689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,2,1,power_law_1.2,2.1818111419677733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,2,1,power_law_1.2,2.2043903350830076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,32,1,balanced,0.2457759976387024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,32,1,balanced,0.24657066663106283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,32,1,power_law_1.01,0.25270400047302244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,32,1,power_law_1.01,0.2575232028961182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,32,1,power_law_1.2,0.2531071901321411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,32,1,power_law_1.2,0.2533760070800781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,4,1,balanced,1.0642986297607422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,4,1,balanced,1.1012159983317058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,4,1,power_law_1.01,1.1308223724365234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,4,1,power_law_1.01,1.1484992027282714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,4,1,power_law_1.2,1.1497088432312013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,4,1,power_law_1.2,1.1628864288330079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,8,1,balanced,0.5899146795272827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,8,1,balanced,0.5970400174458822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,8,1,power_law_1.01,0.6208384037017822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,8,1,power_law_1.01,0.624294376373291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,8,1,power_law_1.2,0.6180352210998535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,16384,2,8,8,1,power_law_1.2,0.6190656185150146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,1,balanced,4.0894880294799805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,1,balanced,4.147647857666016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,1,power_law_1.01,5.176287841796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,1,power_law_1.01,5.189337539672851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,1,power_law_1.2,5.055583953857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,1,power_law_1.2,5.381497573852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,128,balanced,0.48071467876434326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,128,balanced,0.4817440112431844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,128,power_law_1.01,0.5381887912750244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,128,power_law_1.01,0.5464320182800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,128,power_law_1.2,0.5768064022064209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,128,power_law_1.2,0.5786880016326904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,16,balanced,0.6696853637695312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,16,balanced,0.6741066773732504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,16,power_law_1.01,0.7839231967926026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,16,power_law_1.01,0.7974656105041504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,16,power_law_1.2,0.869222354888916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,16,power_law_1.2,0.8804351806640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,2,balanced,2.230133374532064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,2,balanced,2.3694400787353516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,2,power_law_1.01,2.649907112121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,2,power_law_1.01,2.7087488174438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,2,power_law_1.2,2.778054428100586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,2,power_law_1.2,2.928441619873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,256,balanced,0.47270401318868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,256,balanced,0.473749319712321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,256,power_law_1.01,0.5130368232727051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,256,power_law_1.01,0.5141056060791016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,256,power_law_1.2,0.5511551856994629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,256,power_law_1.2,0.5600959777832031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,32,balanced,0.5617920160293579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,32,balanced,0.5634080171585083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,32,power_law_1.01,0.6597824096679688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,32,power_law_1.01,0.6642047882080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,32,power_law_1.2,0.7019392013549804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,32,power_law_1.2,0.7055295944213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,4,balanced,1.3243253231048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,4,balanced,1.3432374000549316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,4,power_law_1.01,1.5697728157043458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,4,power_law_1.01,1.6083456039428712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,4,power_law_1.2,1.643552017211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,4,power_law_1.2,1.7191871643066405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,64,balanced,0.5033066670099894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,64,balanced,0.5043893257776896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,64,power_law_1.01,0.579315185546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,64,power_law_1.01,0.5916863918304444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,64,power_law_1.2,0.6180799961090088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,64,power_law_1.2,0.6201280117034912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,8,balanced,0.8859786987304688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,8,balanced,0.8868800004323324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,8,power_law_1.01,1.0827584266662598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,8,power_law_1.01,1.0985088348388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,8,power_law_1.2,1.138374423980713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,1,8,power_law_1.2,1.155571174621582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,16,1,balanced,0.5799359877904257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,16,1,balanced,0.5829226573308309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,16,1,power_law_1.01,0.6773439884185791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,16,1,power_law_1.01,0.6782656192779541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,16,1,power_law_1.2,0.686297607421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,16,1,power_law_1.2,0.6948800086975098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,2,1,balanced,2.12605873743693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,2,1,balanced,2.1523893674214682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,2,1,power_law_1.01,2.5388927459716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,2,1,power_law_1.01,2.541267204284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,2,1,power_law_1.2,2.628595161437988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,2,1,power_law_1.2,2.689273643493652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,32,1,balanced,0.4761173327763875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,32,1,balanced,0.47619199752807617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,32,1,power_law_1.01,0.5678080081939697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,32,1,power_law_1.01,0.5699903964996338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,32,1,power_law_1.2,0.5808320045471191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,32,1,power_law_1.2,0.5824895858764648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,4,1,balanced,1.208778699239095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,4,1,balanced,1.2161386807759602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,4,1,power_law_1.01,1.4387007713317872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,4,1,power_law_1.01,1.4449536323547363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,4,1,power_law_1.2,1.5009087562561034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,4,1,power_law_1.2,1.5067584037780761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,8,1,balanced,0.7954186598459879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,8,1,balanced,0.7954826354980469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,8,1,power_law_1.01,0.9415936470031738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,8,1,power_law_1.01,0.9457663536071778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,8,1,power_law_1.2,0.9621952056884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2048,8,256,8,1,power_law_1.2,0.969753646850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,1,balanced,5.130085309346517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,1,balanced,5.230314572652181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,1,power_law_1.01,4.811014556884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,1,power_law_1.01,4.966777420043945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,1,power_law_1.2,4.909408187866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,1,power_law_1.2,5.285599899291992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,16,balanced,0.7159413496653239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,16,balanced,0.7197226683298746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,16,power_law_1.01,0.8187392234802247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,16,power_law_1.01,0.8542592048645019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,16,power_law_1.2,0.9302080154418946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,16,power_law_1.2,0.9626815795898438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,2,balanced,2.7085173924764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,2,balanced,2.8117758433024087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,2,power_law_1.01,2.6972671508789063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,2,power_law_1.01,2.805766487121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,2,power_law_1.2,2.8229631423950194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,2,power_law_1.2,2.831609535217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,32,balanced,0.5862559874852499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,32,balanced,0.5868266820907593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,32,power_law_1.01,0.6892864227294921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,32,power_law_1.01,0.7291391849517822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,32,power_law_1.2,0.796614408493042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,32,power_law_1.2,0.7995584011077881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,4,balanced,1.531941254933675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,4,balanced,1.5429226557413738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,4,power_law_1.01,1.6229183197021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,4,power_law_1.01,1.7219200134277344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,4,power_law_1.2,1.7015039443969726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,4,power_law_1.2,1.7180160522460937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,8,balanced,0.9789813359578451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,8,balanced,0.980725367863973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,8,power_law_1.01,1.0538559913635255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,8,power_law_1.01,1.0857536315917968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,8,power_law_1.2,1.1493120193481445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,1,8,power_law_1.2,1.236793613433838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,16,1,balanced,0.6844586531321207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,16,1,balanced,0.6857226689656576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,16,1,power_law_1.01,0.6790719985961914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,16,1,power_law_1.01,0.6814847946166992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,16,1,power_law_1.2,0.6857600212097168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,16,1,power_law_1.2,0.6900159835815429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,2,1,balanced,2.540426731109619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,2,1,balanced,2.631274700164795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,2,1,power_law_1.01,2.486867141723633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,2,1,power_law_1.01,2.4977855682373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,2,1,power_law_1.2,2.4611711502075195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,2,1,power_law_1.2,2.487033653259277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,32,1,balanced,0.5863519906997681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,32,1,balanced,0.5869173208872477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,32,1,power_law_1.01,0.5747903823852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,32,1,power_law_1.01,0.5781760215759277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,32,1,power_law_1.2,0.5867712020874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,32,1,power_law_1.2,0.5871039867401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,4,1,balanced,1.4170400301615398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,4,1,balanced,1.4292106628417969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,4,1,power_law_1.01,1.3896512031555175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,4,1,power_law_1.01,1.394918441772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,4,1,power_law_1.2,1.4223296165466308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,4,1,power_law_1.2,1.4278528213500976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,8,1,balanced,0.8952693144480387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,8,1,balanced,0.8957493305206299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,8,1,power_law_1.01,0.8875328063964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,8,1,power_law_1.01,0.8881535530090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,8,1,power_law_1.2,0.8947456359863282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,6144,2560,8,160,8,1,power_law_1.2,0.8987263679504395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,1,balanced,4.698111852010091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,1,balanced,4.779845237731934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,1,power_law_1.01,5.895129776000976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,1,power_law_1.01,6.053580856323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,1,power_law_1.2,6.146899032592773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,1,power_law_1.2,6.409855651855469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,128,balanced,0.5279893477757772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,128,balanced,0.5290826559066772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,128,power_law_1.01,0.6035071849822998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,128,power_law_1.01,0.6077184200286865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,128,power_law_1.2,0.6339327812194824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,128,power_law_1.2,0.6379968166351319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,16,balanced,0.7559359868367513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,16,balanced,0.7572373549143473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,16,power_law_1.01,0.898316764831543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,16,power_law_1.01,0.9123647689819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,16,power_law_1.2,0.9778880119323731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,16,power_law_1.2,0.9909503936767579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,2,balanced,2.777791976928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,2,balanced,2.8395039240519204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,2,power_law_1.01,3.2008384704589843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,2,power_law_1.01,3.264255905151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,2,power_law_1.2,3.321023941040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,2,power_law_1.2,3.4038974761962892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,256,balanced,0.5202240149180094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,256,balanced,0.5206240018208822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,256,power_law_1.01,0.5692224025726318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,256,power_law_1.01,0.5741439819335937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,256,power_law_1.2,0.6160639762878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,256,power_law_1.2,0.6228096008300781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,32,balanced,0.6226773262023926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,32,balanced,0.6239093144734701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,32,power_law_1.01,0.7359039783477783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,32,power_law_1.01,0.7380799770355224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,32,power_law_1.2,0.7898240089416504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,32,power_law_1.2,0.8148927688598633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,4,balanced,1.5272960662841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,4,balanced,1.5357066790262859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,4,power_law_1.01,1.886662483215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,4,power_law_1.01,1.8902528762817383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,4,power_law_1.2,1.969375991821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,4,power_law_1.2,2.0218175888061523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,64,balanced,0.5548373460769653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,64,balanced,0.5578293402989706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,64,power_law_1.01,0.6584832191467285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,64,power_law_1.01,0.6629631996154786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,64,power_law_1.2,0.7120448112487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,64,power_law_1.2,0.7293759822845459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,8,balanced,1.0032800038655598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,8,balanced,1.0044746398925781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,8,power_law_1.01,1.2165887832641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,8,power_law_1.01,1.225126361846924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,8,power_law_1.2,1.275430393218994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,1,8,power_law_1.2,1.3278271675109863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,16,1,balanced,0.6695893605550131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,16,1,balanced,0.6710293292999268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,16,1,power_law_1.01,0.782585620880127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,16,1,power_law_1.01,0.7858431816101075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,16,1,power_law_1.2,0.7931007862091064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,16,1,power_law_1.2,0.8007040023803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,2,1,balanced,2.5183733304341636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,2,1,balanced,2.648757298787435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,2,1,power_law_1.01,3.0257535934448243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,2,1,power_law_1.01,3.0677631378173826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,2,1,power_law_1.2,3.080134391784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,2,1,power_law_1.2,3.1102975845336913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,32,1,balanced,0.5462239980697632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,32,1,balanced,0.5468693176905314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,32,1,power_law_1.01,0.6583295822143554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,32,1,power_law_1.01,0.6609216213226319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,32,1,power_law_1.2,0.667091178894043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,32,1,power_law_1.2,0.6693696022033692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,4,1,balanced,1.3974827130635579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,4,1,balanced,1.4286826451619465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,4,1,power_law_1.01,1.6765823364257812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,4,1,power_law_1.01,1.6838720321655274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,4,1,power_law_1.2,1.7375360488891602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,4,1,power_law_1.2,1.7528192520141601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,8,1,balanced,0.922714630762736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,8,1,balanced,0.9239359696706136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,8,1,power_law_1.01,1.0816960334777832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,8,1,power_law_1.01,1.0985407829284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,8,1,power_law_1.2,1.1187135696411132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,256,8,1,power_law_1.2,1.1187520027160645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,1,balanced,6.868634541829427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,1,balanced,6.968736012776692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,1,power_law_1.01,7.392755126953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,1,power_law_1.01,7.566835021972656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,1,power_law_1.2,7.835469055175781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,1,power_law_1.2,8.109177398681641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,128,balanced,0.5979946851730347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,128,balanced,0.6005173524220785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,128,power_law_1.01,0.6492544174194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,128,power_law_1.01,0.6548736095428467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,128,power_law_1.2,0.6903999805450439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,128,power_law_1.2,0.7180352210998535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,16,balanced,0.9249493281046549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,16,balanced,0.9265600045522054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,16,power_law_1.01,1.02291841506958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,16,power_law_1.01,1.0396224021911622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,16,power_law_1.2,1.0698559761047364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,16,power_law_1.2,1.1137984275817872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,2,balanced,3.7650559743245444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,2,balanced,3.8652480443318686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,2,power_law_1.01,4.052127838134766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,2,power_law_1.01,4.1345985412597654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,2,power_law_1.2,4.17462387084961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,2,power_law_1.2,4.17509765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,32,balanced,0.7459680239359537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,32,balanced,0.7466826438903809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,32,power_law_1.01,0.8173952102661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,32,power_law_1.01,0.8210304260253907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,32,power_law_1.2,0.8623680114746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,32,power_law_1.2,0.887724781036377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,4,balanced,2.052031993865967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,4,balanced,2.0555787086486816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,4,power_law_1.01,2.2394687652587892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,4,power_law_1.01,2.2415935516357424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,4,power_law_1.2,2.333171272277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,4,power_law_1.2,2.368684768676758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,64,balanced,0.645413319269816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,64,balanced,0.6454399824142456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,64,power_law_1.01,0.7030399799346924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,64,power_law_1.01,0.7117248058319092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,64,power_law_1.2,0.726803207397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,64,power_law_1.2,0.7513216018676758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,8,balanced,1.3080426851908367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,8,balanced,1.3090559641520183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,8,power_law_1.01,1.4265407562255858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,8,power_law_1.01,1.4426176071166992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,8,power_law_1.2,1.4916735649108888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,1,8,power_law_1.2,1.5488191604614259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,16,1,balanced,0.8779093424479166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,16,1,balanced,0.8786773681640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,16,1,power_law_1.01,0.9593024253845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,16,1,power_law_1.01,0.9606399536132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,16,1,power_law_1.2,0.981107234954834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,16,1,power_law_1.2,0.9829504013061523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,2,1,balanced,3.6284427642822266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,2,1,balanced,3.647120157877604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,2,1,power_law_1.01,3.73741455078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,2,1,power_law_1.01,3.751398468017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,2,1,power_law_1.2,3.974553680419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,2,1,power_law_1.2,4.025568008422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,32,1,balanced,0.7258613109588623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,32,1,balanced,0.7272053559621176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,32,1,power_law_1.01,0.7496960163116455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,32,1,power_law_1.01,0.7573631763458252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,32,1,power_law_1.2,0.7737664222717285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,32,1,power_law_1.2,0.7740608215332031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,4,1,balanced,1.9619359970092773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,4,1,balanced,1.9678880373636882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,4,1,power_law_1.01,2.0649152755737306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,4,1,power_law_1.01,2.0714176177978514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,4,1,power_law_1.2,2.175833511352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,4,1,power_law_1.2,2.2062400817871093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,8,1,balanced,1.2487040360768635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,8,1,balanced,1.2505546410878499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,8,1,power_law_1.01,1.3241279602050782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,8,1,power_law_1.01,1.3241663932800294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,8,1,power_law_1.2,1.3602047920227052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,3072,7168,2048,8,384,8,1,power_law_1.2,1.3679488182067872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,1,balanced,0.20654932657877603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,1,balanced,0.20732800165812174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,1,power_law_1.01,0.17478400468826294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,1,power_law_1.01,0.17571840286254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,1,power_law_1.2,0.17571200132369996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,1,power_law_1.2,0.17786240577697754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,128,balanced,0.02922133356332779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,128,balanced,0.0314026673634847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,128,power_law_1.01,0.029254400730133058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,128,power_law_1.01,0.029286399483680725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,128,power_law_1.2,0.02881920039653778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,128,power_law_1.2,0.028883200883865357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,16,balanced,0.03763733307520548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,16,balanced,0.03790933390458425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,16,power_law_1.01,0.03549439907073974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,16,power_law_1.01,0.036499199271202085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,16,power_law_1.2,0.035392001271247864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,16,power_law_1.2,0.0367680013179779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,2,balanced,0.1277653376261393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,2,balanced,0.13637866576512656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,2,power_law_1.01,0.11063679456710815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,2,power_law_1.01,0.11581439971923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,2,power_law_1.2,0.11020159721374512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,2,power_law_1.2,0.11342719793319703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,32,balanced,0.03233066697915395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,32,balanced,0.032655999064445496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,32,power_law_1.01,0.030291199684143066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,32,power_law_1.01,0.030502399802207945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,32,power_law_1.2,0.030425599217414855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,32,power_law_1.2,0.030803200602531434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,4,balanced,0.07930133243401845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,4,balanced,0.08111466467380524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,4,power_law_1.01,0.07460479736328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,4,power_law_1.01,0.07468159794807434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,4,power_law_1.2,0.07244799733161926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,4,power_law_1.2,0.07363839745521546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,64,balanced,0.0312266672650973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,64,balanced,0.031386665999889374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,64,power_law_1.01,0.02956160008907318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,64,power_law_1.01,0.029900801181793214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,64,power_law_1.2,0.02937600016593933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,64,power_law_1.2,0.02999039888381958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,8,balanced,0.05406400064627329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,8,balanced,0.05566399792830149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,8,power_law_1.01,0.05041279792785645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,8,power_law_1.01,0.05092480182647705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,8,power_law_1.2,0.048640000820159915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,1,8,power_law_1.2,0.051571202278137204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,2,1,balanced,0.13378133376439413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,2,1,balanced,0.13410133123397827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,2,1,power_law_1.01,0.1126911997795105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,2,1,power_law_1.01,0.11373440027236939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,2,1,power_law_1.2,0.11134079694747925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,2,1,power_law_1.2,0.11326719522476196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,4,1,balanced,0.09356799721717834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,4,1,balanced,0.09464533130327861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,4,1,power_law_1.01,0.08311039805412293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,4,1,power_law_1.01,0.08454399704933166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,4,1,power_law_1.2,0.08367999792098998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2048,768,8,128,4,1,power_law_1.2,0.08513280153274536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,1,balanced,0.5752906799316406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,1,balanced,0.5784906546274821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,1,power_law_1.01,0.44323201179504396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,1,power_law_1.01,0.44576001167297363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,1,power_law_1.2,0.45314559936523435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,1,power_law_1.2,0.4553215980529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,128,balanced,0.03573333223660787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,128,balanced,0.03603733330965042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,128,power_law_1.01,0.03399679958820343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,128,power_law_1.01,0.03418880105018616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,128,power_law_1.2,0.03441919982433319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,128,power_law_1.2,0.034534400701522826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,16,balanced,0.0724373310804367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,16,balanced,0.07253333429495494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,16,power_law_1.01,0.06488959789276123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,16,power_law_1.01,0.0667967975139618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,16,power_law_1.2,0.0630079984664917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,16,power_law_1.2,0.06409599781036376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,2,balanced,0.3147733410199483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,2,balanced,0.3165760040283203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,2,power_law_1.01,0.2630784034729004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,2,power_law_1.01,0.27141120433807375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,2,power_law_1.2,0.2538367986679077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,2,power_law_1.2,0.254803204536438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,32,balanced,0.049685334165891014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,32,balanced,0.05178666611512502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,32,power_law_1.01,0.0474368005990982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,32,power_law_1.01,0.04747520089149475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,32,power_law_1.2,0.04839679896831513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,32,power_law_1.2,0.048979198932647704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,4,balanced,0.18174399932225546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,4,balanced,0.18227199713389078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,4,power_law_1.01,0.14305919408798218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,4,power_law_1.01,0.15468159914016724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,4,power_law_1.2,0.1472383975982666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,4,power_law_1.2,0.15740159749984742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,64,balanced,0.039034667114416756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,64,balanced,0.039461334546407066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,64,power_law_1.01,0.03811199963092804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,64,power_law_1.01,0.03829120099544525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,64,power_law_1.2,0.03764480054378509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,64,power_law_1.2,0.03788160085678101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,8,balanced,0.1106773316860199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,8,balanced,0.11089066664377849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,8,power_law_1.01,0.09419519901275634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,8,power_law_1.01,0.09616000056266785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,8,power_law_1.2,0.09307519793510437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,1,8,power_law_1.2,0.09895679950714112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,16,1,balanced,0.2281279961268107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,16,1,balanced,0.23221333821614584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,16,1,power_law_1.01,0.1695039987564087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,16,1,power_law_1.01,0.17197439670562745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,16,1,power_law_1.2,0.17060480117797852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,16,1,power_law_1.2,0.17228800058364868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,2,1,balanced,0.3199839989344279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,2,1,balanced,0.3202666640281677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,2,1,power_law_1.01,0.25509119033813477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,2,1,power_law_1.01,0.25680639743804934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,2,1,power_law_1.2,0.25114240646362307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,2,1,power_law_1.2,0.2539391994476318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,32,1,balanced,0.20683733622233072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,32,1,balanced,0.20731200774510702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,32,1,power_law_1.01,0.15924479961395263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,32,1,power_law_1.01,0.16028159856796265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,32,1,power_law_1.2,0.1577023983001709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,32,1,power_law_1.2,0.1579519987106323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,4,1,balanced,0.19525333245595297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,4,1,balanced,0.19714132944742838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,4,1,power_law_1.01,0.15567359924316407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,4,1,power_law_1.01,0.15750399827957154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,4,1,power_law_1.2,0.15527679920196533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,4,1,power_law_1.2,0.15763839483261108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,8,1,balanced,0.2813599904378255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,8,1,balanced,0.2816320061683655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,8,1,power_law_1.01,0.215065598487854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,8,1,power_law_1.01,0.21704320907592772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,8,1,power_law_1.2,0.2134399890899658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,2688,1856,6,128,8,1,power_law_1.2,0.21466879844665526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,1,balanced,1.0432799657185872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,1,balanced,1.0447680155436199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,1,power_law_1.01,0.5331647872924805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,1,power_law_1.01,0.5526463985443115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,1,power_law_1.2,0.5044095993041993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,1,power_law_1.2,0.5207680225372314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,128,balanced,0.04560533165931702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,128,balanced,0.04574400186538696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,128,power_law_1.01,0.04446719884872437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,128,power_law_1.01,0.04459519982337952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,128,power_law_1.2,0.044275200366973876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,128,power_law_1.2,0.04508160054683685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,16,balanced,0.11061867078145345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,16,balanced,0.11117866635322571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,16,power_law_1.01,0.09823359847068787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,16,power_law_1.01,0.10119040012359619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,16,power_law_1.2,0.08495360016822814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,16,power_law_1.2,0.09290879964828491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,2,balanced,0.5482186476389567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,2,balanced,0.5482986768086752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,2,power_law_1.01,0.3047616004943848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,2,power_law_1.01,0.30794880390167234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,2,power_law_1.2,0.27650558948516846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,2,power_law_1.2,0.2861696004867554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,256,balanced,0.043509334325790405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,256,balanced,0.04397333165009817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,256,power_law_1.01,0.041766399145126344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,256,power_law_1.01,0.042131200432777405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,256,power_law_1.2,0.04186240136623383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,256,power_law_1.2,0.04211199879646301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,32,balanced,0.07833600044250488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,32,balanced,0.07852266728878021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,32,power_law_1.01,0.06713600158691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,32,power_law_1.01,0.06714879870414733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,32,power_law_1.2,0.06298879981040954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,32,power_law_1.2,0.07096959948539734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,4,balanced,0.31062932809193927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,4,balanced,0.31272000074386597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,4,power_law_1.01,0.21659519672393798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,4,power_law_1.01,0.22291839122772217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,4,power_law_1.2,0.1945472002029419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,4,power_law_1.2,0.1958080053329468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,64,balanced,0.05580266813437144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,64,balanced,0.05604266623655955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,64,power_law_1.01,0.052288001775741576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,64,power_law_1.01,0.05372160077095032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,64,power_law_1.2,0.049497601389884946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,64,power_law_1.2,0.04982399940490723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,8,balanced,0.17549333969751993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,8,balanced,0.1771199901898702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,8,power_law_1.01,0.16121599674224854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,8,power_law_1.01,0.16376960277557373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,8,power_law_1.2,0.13586560487747193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,1,8,power_law_1.2,0.16128640174865722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,16,1,balanced,0.16251200437545776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,16,1,balanced,0.1647040049235026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,16,1,power_law_1.01,0.09655680060386658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,16,1,power_law_1.01,0.09982720017433167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,16,1,power_law_1.2,0.09218559861183166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,16,1,power_law_1.2,0.09290879964828491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,2,1,balanced,0.5523893435796102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,2,1,balanced,0.5725333293279012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,2,1,power_law_1.01,0.2964864015579224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,2,1,power_law_1.01,0.2997503995895386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,2,1,power_law_1.2,0.27234559059143065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,2,1,power_law_1.2,0.2823424100875854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,32,1,balanced,0.15001599987347922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,32,1,balanced,0.15119466185569763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,32,1,power_law_1.01,0.08749439716339111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,32,1,power_law_1.01,0.08894079923629761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,32,1,power_law_1.2,0.08130559921264649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,32,1,power_law_1.2,0.08311039805412293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,4,1,balanced,0.3262186646461487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,4,1,balanced,0.32655467589696247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,4,1,power_law_1.01,0.18339840173721314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,4,1,power_law_1.01,0.18785279989242554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,4,1,power_law_1.2,0.16871039867401122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,4,1,power_law_1.2,0.17704960107803344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,8,1,balanced,0.2267733414967855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,8,1,balanced,0.2281066576639811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,8,1,power_law_1.01,0.13022719621658324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,8,1,power_law_1.01,0.13175040483474731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,8,1,power_law_1.2,0.12296960353851319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,3072,1536,8,256,8,1,power_law_1.2,0.1232192039489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,1,balanced,0.48152534166971844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,1,balanced,0.4832693338394165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,1,power_law_1.01,0.47324161529541015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,1,power_law_1.01,0.5082943916320801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,1,power_law_1.2,0.4915520191192627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,1,power_law_1.2,0.5192704200744629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,2,balanced,0.25018133719762164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,2,balanced,0.2520586649576823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,2,power_law_1.01,0.2597759962081909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,2,power_law_1.01,0.28801279067993163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,2,power_law_1.2,0.268556809425354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,2,power_law_1.2,0.2832767963409424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,4,balanced,0.1653493344783783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,4,balanced,0.1738026738166809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,4,power_law_1.01,0.17482240200042726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,4,power_law_1.01,0.1907520055770874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,4,power_law_1.2,0.19362560510635377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,4,power_law_1.2,0.19417599439620972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,8,balanced,0.11498666803042094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,8,balanced,0.11585600177447002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,8,power_law_1.01,0.150271999835968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,8,power_law_1.01,0.1515328049659729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,8,power_law_1.2,0.14126720428466796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,1,8,power_law_1.2,0.15930880308151246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,16,1,balanced,0.057589332262674965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,16,1,balanced,0.05761066575845083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,16,1,power_law_1.01,0.054553598165512085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,16,1,power_law_1.01,0.05637120008468628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,16,1,power_law_1.2,0.05324159860610962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,16,1,power_law_1.2,0.053913599252700804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,2,1,balanced,0.2571413318316142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,2,1,balanced,0.25830399990081787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,2,1,power_law_1.01,0.2637311935424805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,2,1,power_law_1.01,0.2642240047454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,2,1,power_law_1.2,0.2667520046234131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,2,1,power_law_1.2,0.26686079502105714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,32,1,balanced,0.035605333745479584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,32,1,balanced,0.03909866760174433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,32,1,power_law_1.01,0.03689599931240082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,32,1,power_law_1.01,0.03792639970779419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,32,1,power_law_1.2,0.03654400110244751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,32,1,power_law_1.2,0.03775359988212586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,4,1,balanced,0.14619732896486917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,4,1,balanced,0.15365333358446756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,4,1,power_law_1.01,0.1431040048599243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,4,1,power_law_1.01,0.14565119743347169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,4,1,power_law_1.2,0.1443711996078491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,4,1,power_law_1.2,0.14602240324020385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,8,1,balanced,0.09705066680908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,8,1,balanced,0.09826133648554485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,8,1,power_law_1.01,0.08908799886703492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,8,1,power_law_1.01,0.09038079977035522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,8,1,power_law_1.2,0.09146239757537841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,14336,2,8,8,1,power_law_1.2,0.09200639724731445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,1,balanced,0.7220266660054525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,1,balanced,0.7220799922943115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,1,power_law_1.01,0.6127103805541992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,1,power_law_1.01,0.6172351837158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,1,power_law_1.2,0.610591983795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,1,power_law_1.2,0.6142399787902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,128,balanced,0.041365332901477814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,128,balanced,0.041562666495641075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,128,power_law_1.01,0.039705601334571836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,128,power_law_1.01,0.040038400888442995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,128,power_law_1.2,0.039987200498580934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,128,power_law_1.2,0.04012160003185272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,16,balanced,0.08264533181985219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,16,balanced,0.0844533344109853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,16,power_law_1.01,0.07578880190849305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,16,power_law_1.01,0.0769216001033783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,16,power_law_1.2,0.07549440264701843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,16,power_law_1.2,0.07693439722061157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,2,balanced,0.3832586606343587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,2,balanced,0.384005347887675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,2,power_law_1.01,0.34552319049835206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,2,power_law_1.01,0.35070080757141114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,2,power_law_1.2,0.33016960620880126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,2,power_law_1.2,0.3371072053909302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,32,balanced,0.059301331639289856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,32,balanced,0.059621334075927734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,32,power_law_1.01,0.057222402095794676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,32,power_law_1.01,0.058406400680541995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,32,power_law_1.2,0.0554751992225647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,32,power_law_1.2,0.055878400802612305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,4,balanced,0.2143253286679586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,4,balanced,0.21620267629623413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,4,power_law_1.01,0.18970880508422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,4,power_law_1.01,0.19780479669570922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,4,power_law_1.2,0.1862912058830261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,4,power_law_1.2,0.20170240402221679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,64,balanced,0.04358399907747904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,64,balanced,0.04378666480382284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,64,power_law_1.01,0.04191359877586365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,64,power_law_1.01,0.04207360148429871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,64,power_law_1.2,0.04227840006351471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,64,power_law_1.2,0.04268159866333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,8,balanced,0.12764267126719156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,8,balanced,0.1286240021387736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,8,power_law_1.01,0.12194559574127198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,8,power_law_1.01,0.12360320091247559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,8,power_law_1.2,0.12112640142440796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,1,8,power_law_1.2,0.12150399684906006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,16,1,balanced,0.11794666449228923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,16,1,balanced,0.12052800258000691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,16,1,power_law_1.01,0.10215679407119752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,16,1,power_law_1.01,0.10305919647216796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,16,1,power_law_1.2,0.10207359790802002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,16,1,power_law_1.2,0.10224640369415283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,2,1,balanced,0.3800853490829468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,2,1,balanced,0.3859573205312093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,2,1,power_law_1.01,0.3151295900344849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,2,1,power_law_1.01,0.32033278942108157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,2,1,power_law_1.2,0.3229696035385132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,2,1,power_law_1.2,0.3275775909423828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,32,1,balanced,0.10389332969983418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,32,1,balanced,0.10705066720644633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,32,1,power_law_1.01,0.09088000059127807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,32,1,power_law_1.01,0.09205759763717651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,32,1,power_law_1.2,0.09129599928855896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,32,1,power_law_1.2,0.09223039746284485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,4,1,balanced,0.23255467414855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,4,1,balanced,0.23480532566706339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,4,1,power_law_1.01,0.19775999784469606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,4,1,power_law_1.01,0.20286719799041747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,4,1,power_law_1.2,0.1923135995864868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,4,1,power_law_1.2,0.1974079966545105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,8,1,balanced,0.1609813372294108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,8,1,balanced,0.16223466396331787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,8,1,power_law_1.01,0.14177279472351073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,8,1,power_law_1.01,0.1448192000389099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,8,1,power_law_1.2,0.14126720428466796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,1536,8,128,8,1,power_law_1.2,0.14234880208969117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,1,balanced,4.783407847086589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,1,balanced,4.806384086608887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,1,power_law_1.01,3.5450817108154298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,1,power_law_1.01,3.5725887298583983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,1,power_law_1.2,3.454982376098633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,1,power_law_1.2,3.485606384277344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,128,balanced,0.12928533554077148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,128,balanced,0.12964800000190735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,128,power_law_1.01,0.12609280347824098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,128,power_law_1.01,0.12712960243225097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,128,power_law_1.2,0.12449920177459717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,128,power_law_1.2,0.1278720021247864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,16,balanced,0.3964800039927165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,16,balanced,0.3975626627604167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,16,power_law_1.01,0.37793920040130613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,16,power_law_1.01,0.39207680225372316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,16,power_law_1.2,0.36168320178985597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,16,power_law_1.2,0.3812096118927002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,2,balanced,2.4252586364746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,2,balanced,2.426208019256592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,2,power_law_1.01,1.8836992263793946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,2,power_law_1.01,1.9887424468994142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,2,power_law_1.2,1.8841983795166015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,2,power_law_1.2,1.8957120895385742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,256,balanced,0.1069653332233429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,256,balanced,0.10719466209411621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,256,power_law_1.01,0.10467840433120727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,256,power_law_1.01,0.10571520328521729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,256,power_law_1.2,0.105075204372406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,256,power_law_1.2,0.1051967978477478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,32,balanced,0.2502506573994954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,32,balanced,0.25094399849573773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,32,power_law_1.01,0.22135040760040284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,32,power_law_1.01,0.22564480304718018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,32,power_law_1.2,0.22282240390777588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,32,power_law_1.2,0.2298815965652466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,4,balanced,1.2648746967315674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,4,balanced,1.2675200303395588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,4,power_law_1.01,1.1133567810058593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,4,power_law_1.01,1.1337087631225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,4,power_law_1.2,1.0222720146179198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,4,power_law_1.2,1.078758430480957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,64,balanced,0.17196265856424967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,64,balanced,0.17271467049916586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,64,power_law_1.01,0.16490880250930787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,64,power_law_1.01,0.16622079610824586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,64,power_law_1.2,0.1619968056678772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,64,power_law_1.2,0.16702719926834106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,8,balanced,0.6856853167215983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,8,balanced,0.687887986501058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,8,power_law_1.01,0.6273791790008545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,8,power_law_1.01,0.6513343811035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,8,power_law_1.2,0.630675220489502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,1,8,power_law_1.2,0.6580543994903565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,16,1,balanced,1.42793607711792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,16,1,balanced,1.4281493822733562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,16,1,power_law_1.01,1.0627967834472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,16,1,power_law_1.01,1.0821056365966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,16,1,power_law_1.2,1.0486271858215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,16,1,power_law_1.2,1.0675007820129394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,2,1,balanced,2.397653261820475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,2,1,balanced,2.4018239974975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,2,1,power_law_1.01,1.7946048736572267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,2,1,power_law_1.01,1.8048639297485352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,2,1,power_law_1.2,1.7644992828369142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,2,1,power_law_1.2,1.7928064346313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,32,1,balanced,1.1799306869506836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,32,1,balanced,1.1812693277994792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,32,1,power_law_1.01,0.8824383735656738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,32,1,power_law_1.01,0.8902912139892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,32,1,power_law_1.2,0.8784895896911621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,32,1,power_law_1.2,0.8872896194458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,4,1,balanced,1.4236799875895183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,4,1,balanced,1.4261120160420735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,4,1,power_law_1.01,1.0483903884887695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,4,1,power_law_1.01,1.063206386566162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,4,1,power_law_1.2,1.0432064056396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,4,1,power_law_1.2,1.064025592803955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,8,1,balanced,0.7998613516489664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,8,1,balanced,0.8005119959513346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,8,1,power_law_1.01,0.6089920043945313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,8,1,power_law_1.01,0.609990406036377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,8,1,power_law_1.2,0.6037119865417481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,4096,2688,22,512,8,1,power_law_1.2,0.6062592029571533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,1,balanced,0.7199892997741699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,1,balanced,0.720789353052775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,1,power_law_1.01,0.7744383811950684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,1,power_law_1.01,0.7788288116455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,1,power_law_1.2,0.7636864185333252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,1,power_law_1.2,0.8009023666381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,2,balanced,0.38386666774749756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,2,balanced,0.4024053414662679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,2,power_law_1.01,0.4049215793609619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,2,power_law_1.01,0.4536384105682373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,2,power_law_1.2,0.46472959518432616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,2,power_law_1.2,0.47128958702087403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,4,balanced,0.22498132785161337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,4,balanced,0.2281066576639811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,4,power_law_1.01,0.262937593460083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,4,power_law_1.01,0.2745856046676636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,4,power_law_1.2,0.289516806602478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,4,power_law_1.2,0.2926016092300415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,8,balanced,0.15078933040301004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,8,balanced,0.1570133368174235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,8,power_law_1.01,0.19428479671478271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,8,power_law_1.01,0.2220736026763916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,8,power_law_1.2,0.19455360174179076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,1,8,power_law_1.2,0.19465600252151488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,16,1,balanced,0.07226666808128357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,16,1,balanced,0.0724533349275589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,16,1,power_law_1.01,0.07215359807014465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,16,1,power_law_1.01,0.07255679965019227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,16,1,power_law_1.2,0.07341439723968506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,16,1,power_law_1.2,0.07456640005111695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,2,1,balanced,0.3784373203913371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,2,1,balanced,0.4087626536687215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,2,1,power_law_1.01,0.405401611328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,2,1,power_law_1.01,0.41121277809143064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,2,1,power_law_1.2,0.39328000545501707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,2,1,power_law_1.2,0.4362495899200439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,32,1,balanced,0.05392000079154968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,32,1,balanced,0.054058666030565895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,32,1,power_law_1.01,0.051923197507858274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,32,1,power_law_1.01,0.05325440168380737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,32,1,power_law_1.2,0.0530239999294281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,32,1,power_law_1.2,0.05551360249519348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,4,1,balanced,0.21475734313329062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,4,1,balanced,0.2302186687787374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,4,1,power_law_1.01,0.21408638954162598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,4,1,power_law_1.01,0.2154752016067505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,4,1,power_law_1.2,0.21660799980163575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,4,1,power_law_1.2,0.21895039081573486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,8,1,balanced,0.13360533118247986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,8,1,balanced,0.14565866192181906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,8,1,power_law_1.01,0.12716799974441528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,8,1,power_law_1.01,0.13032959699630736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,8,1,power_law_1.2,0.13189760446548462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,16384,2,8,8,1,power_law_1.2,0.13322880268096923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,1,balanced,2.6985867818196616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,1,balanced,2.7073974609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,1,power_law_1.01,1.3823871612548828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,1,power_law_1.01,1.4216064453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,1,power_law_1.2,1.2534527778625488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,1,power_law_1.2,1.2931327819824219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,128,balanced,0.0765066643555959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,128,balanced,0.07683733105659485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,128,power_law_1.01,0.07502719759941101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,128,power_law_1.01,0.07608960270881653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,128,power_law_1.2,0.07562879920005798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,128,power_law_1.2,0.07587839961051941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,16,balanced,0.23456533749898276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,16,balanced,0.23511467377344766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,16,power_law_1.01,0.17415679693222047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,16,power_law_1.01,0.1958143949508667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,16,power_law_1.2,0.19054720401763917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,16,power_law_1.2,0.2015552043914795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,2,balanced,1.381930669148763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,2,balanced,1.382570743560791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,2,power_law_1.01,0.7420928001403808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,2,power_law_1.01,0.7695168018341064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,2,power_law_1.2,0.729036808013916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,2,power_law_1.2,0.7646912097930908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,256,balanced,0.06223999957243601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,256,balanced,0.06229866544405619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,256,power_law_1.01,0.06106879711151123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,256,power_law_1.01,0.06157439947128296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,256,power_law_1.2,0.061343997716903687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,32,balanced,0.1518239974975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,32,balanced,0.1532693306605021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,32,power_law_1.01,0.12265599966049194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,32,power_law_1.01,0.14092799425125122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,32,power_law_1.2,0.1183616042137146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,32,power_law_1.2,0.1223680019378662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,4,balanced,0.728607972462972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,4,balanced,0.7322666645050049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,4,power_law_1.01,0.4590400218963623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,4,power_law_1.01,0.5348800182342529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,4,power_law_1.2,0.45095038414001465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,4,power_law_1.2,0.5064832210540772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,64,balanced,0.09865599870681763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,64,balanced,0.09902933239936829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,64,power_law_1.01,0.08605440258979798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,64,power_law_1.01,0.08755840063095092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,64,power_law_1.2,0.08675199747085571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,64,power_law_1.2,0.09214720129966736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,8,balanced,0.3917119900385539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,8,balanced,0.393887996673584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,8,power_law_1.01,0.3150399923324585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,8,power_law_1.01,0.331443190574646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,8,power_law_1.2,0.2922048091888428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,1,8,power_law_1.2,0.31267199516296384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,16,1,balanced,0.3345866600672404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,16,1,balanced,0.3368053436279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,16,1,power_law_1.01,0.1998975992202759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,16,1,power_law_1.01,0.20185599327087403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,16,1,power_law_1.2,0.1788480043411255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,16,1,power_law_1.2,0.18436479568481445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,2,1,balanced,1.4016532897949219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,2,1,balanced,1.4044426282246907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,2,1,power_law_1.01,0.7247488021850585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,2,1,power_law_1.01,0.7403200149536133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,2,1,power_law_1.2,0.6696191787719726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,2,1,power_law_1.2,0.6868735790252686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,32,1,balanced,0.2801919976870219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,32,1,balanced,0.28332799673080444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,32,1,power_law_1.01,0.15850239992141724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,32,1,power_law_1.01,0.16019840240478517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,32,1,power_law_1.2,0.14431999921798705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,32,1,power_law_1.2,0.14812159538269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,4,1,balanced,0.7719733715057373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,4,1,balanced,0.7747039794921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,4,1,power_law_1.01,0.4181503772735596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,4,1,power_law_1.01,0.42098560333251955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,4,1,power_law_1.2,0.3784064054489136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,4,1,power_law_1.2,0.390720009803772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,8,1,balanced,0.4755306641260783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,8,1,balanced,0.47621333599090576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,8,1,power_law_1.01,0.27352960109710694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,8,1,power_law_1.01,0.2735680103302002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,8,1,power_law_1.2,0.25483520030975343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2048,8,256,8,1,power_law_1.2,0.2587199926376343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,1,balanced,2.1257386207580566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,1,balanced,2.1291146278381348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,1,power_law_1.01,1.6855487823486328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,1,power_law_1.01,1.6870655059814452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,1,power_law_1.2,1.6187711715698243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,1,power_law_1.2,1.6194368362426759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,16,balanced,0.18096532424290976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,16,balanced,0.1819360057512919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,16,power_law_1.01,0.16293760538101196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,16,power_law_1.01,0.16583679914474486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,16,power_law_1.2,0.16373759508132935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,16,power_law_1.2,0.17508480548858643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,2,balanced,1.0890080134073894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,2,balanced,1.094058672587077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,2,power_law_1.01,0.8733823776245118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,2,power_law_1.01,0.8856191635131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,2,power_law_1.2,0.8929408073425293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,2,power_law_1.2,0.9388863563537597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,32,balanced,0.11802666385968526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,32,balanced,0.11930666367212932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,32,power_law_1.01,0.10932480096817017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,32,power_law_1.01,0.11175040006637574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,32,power_law_1.2,0.10228480100631714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,32,power_law_1.2,0.11326719522476196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,4,balanced,0.5803626775741577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,4,balanced,0.5806293487548828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,4,power_law_1.01,0.49125118255615235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,4,power_law_1.01,0.5012671947479248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,4,power_law_1.2,0.5149631977081299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,4,power_law_1.2,0.515174388885498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,8,balanced,0.3125973343849182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,8,balanced,0.31462399164835614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,8,power_law_1.01,0.2837440013885498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,8,power_law_1.01,0.2904191970825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,8,power_law_1.2,0.26268160343170166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,1,8,power_law_1.2,0.268505597114563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,16,1,balanced,0.2587413390477498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,16,1,balanced,0.26078933477401733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,16,1,power_law_1.01,0.21465599536895752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,16,1,power_law_1.01,0.21960320472717285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,16,1,power_law_1.2,0.21780478954315186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,16,1,power_law_1.2,0.2191231966018677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,2,1,balanced,1.0887573560078938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,2,1,balanced,1.0898293654123943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,2,1,power_law_1.01,0.8515839576721191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,2,1,power_law_1.01,0.8530240058898926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,2,1,power_law_1.2,0.8391743659973144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,2,1,power_law_1.2,0.8558015823364258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,32,1,balanced,0.20403200387954712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,32,1,balanced,0.20589866240819296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,32,1,power_law_1.01,0.15367679595947265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,32,1,power_law_1.01,0.1538624048233032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,32,1,power_law_1.2,0.15319679975509642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,32,1,power_law_1.2,0.15325440168380738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,4,1,balanced,0.6033546527226766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,4,1,balanced,0.6207840045293173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,4,1,power_law_1.01,0.4651648044586182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,4,1,power_law_1.01,0.46682238578796387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,4,1,power_law_1.2,0.4650112152099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,4,1,power_law_1.2,0.46503682136535646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,8,1,balanced,0.3658986488978068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,8,1,balanced,0.36692798137664795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,8,1,power_law_1.01,0.28929920196533204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,8,1,power_law_1.01,0.29166719913482664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,8,1,power_law_1.2,0.2897855997085571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,6144,2560,8,160,8,1,power_law_1.2,0.2916287899017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,1,balanced,3.1471840540568032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,1,balanced,3.1476799647013345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,1,power_law_1.01,1.5869376182556152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,1,power_law_1.01,1.5876992225646973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,1,power_law_1.2,1.5044992446899415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,1,power_law_1.2,1.5467264175415039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,128,balanced,0.08639466762542725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,128,balanced,0.08729599912961324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,128,power_law_1.01,0.08498560190200806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,128,power_law_1.01,0.08532480001449586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,128,power_law_1.2,0.08501759767532349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,128,power_law_1.2,0.08515840172767639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,16,balanced,0.27317333221435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,16,balanced,0.2786399920781453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,16,power_law_1.01,0.23780479431152343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,16,power_law_1.01,0.24466559886932374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,16,power_law_1.2,0.20277760028839112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,16,power_law_1.2,0.21990399360656737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,2,balanced,1.6055199305216472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,2,balanced,1.6082666714986165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,2,power_law_1.01,0.895199966430664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,2,power_law_1.01,1.009932804107666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,2,power_law_1.2,0.8355648040771484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,2,power_law_1.2,0.8382528305053711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,256,balanced,0.07025066514809926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,256,balanced,0.07251200079917908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,256,power_law_1.01,0.06972159743309021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,256,power_law_1.01,0.07000319957733155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,256,power_law_1.2,0.0704255998134613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,256,power_law_1.2,0.07051519751548767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,32,balanced,0.17565866311391196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,32,balanced,0.18069867293039957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,32,power_law_1.01,0.12940800189971924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,32,power_law_1.01,0.15507839918136596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,32,power_law_1.2,0.12547199726104735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,32,power_law_1.2,0.16503679752349854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,4,balanced,0.8452373345692953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,4,balanced,0.8455893198649088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,4,power_law_1.01,0.5617792129516601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,4,power_law_1.01,0.5642816066741944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,4,power_law_1.2,0.5429247856140137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,4,power_law_1.2,0.5429823875427247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,64,balanced,0.11101866761843364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,64,balanced,0.11136000355084737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,64,power_law_1.01,0.10087679624557495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,64,power_law_1.01,0.10655360221862793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,64,power_law_1.2,0.09688320159912109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,64,power_law_1.2,0.10274560451507568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,8,balanced,0.4527093172073364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,8,balanced,0.46191998322804767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,8,power_law_1.01,0.37015039920806886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,8,power_law_1.01,0.41096959114074705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,8,power_law_1.2,0.33886721134185793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,1,8,power_law_1.2,0.42905597686767577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,16,1,balanced,0.387664000193278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,16,1,balanced,0.3880373239517212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,16,1,power_law_1.01,0.2306879997253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,16,1,power_law_1.01,0.23618559837341307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,16,1,power_law_1.2,0.21086719036102294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,16,1,power_law_1.2,0.2190783977508545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,2,1,balanced,1.6336906750996907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,2,1,balanced,1.6393225987752278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,2,1,power_law_1.01,0.8606080055236817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,2,1,power_law_1.01,0.880031967163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,2,1,power_law_1.2,0.7896512031555176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,2,1,power_law_1.2,0.8026111602783204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,32,1,balanced,0.32845866680145264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,32,1,balanced,0.3298773368199666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,32,1,power_law_1.01,0.1805888056755066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,32,1,power_law_1.01,0.18497920036315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,32,1,power_law_1.2,0.16519039869308472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,32,1,power_law_1.2,0.1670016050338745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,4,1,balanced,0.8996427059173584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,4,1,balanced,0.9327627023061117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,4,1,power_law_1.01,0.4791999816894531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,4,1,power_law_1.01,0.48329601287841795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,4,1,power_law_1.2,0.44590082168579104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,4,1,power_law_1.2,0.45197439193725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,8,1,balanced,0.5495626529057821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,8,1,balanced,0.5511786540349325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,8,1,power_law_1.01,0.3145279884338379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,8,1,power_law_1.01,0.3170687913894653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,8,1,power_law_1.2,0.28755199909210205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,256,8,1,power_law_1.2,0.29580800533294677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,1,balanced,3.1480798721313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,1,balanced,3.148554801940918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,1,power_law_1.01,2.0314111709594727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,1,power_law_1.01,2.065388870239258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,1,power_law_1.2,1.8379968643188476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,1,power_law_1.2,1.8420671463012694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,128,balanced,0.08647466699282329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,128,balanced,0.08904000123341878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,128,power_law_1.01,0.09155200123786926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,128,power_law_1.01,0.09316480159759521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,128,power_law_1.2,0.08940799832344055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,128,power_law_1.2,0.09018880128860474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,16,balanced,0.2709333300590515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,16,balanced,0.2720213333765666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,16,power_law_1.01,0.3535871982574463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,16,power_law_1.01,0.35817599296569824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,16,power_law_1.2,0.32639360427856445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,16,power_law_1.2,0.35834240913391113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,2,balanced,1.6100266774495442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,2,balanced,1.6118613878885906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,2,power_law_1.01,1.204422378540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,2,power_law_1.01,1.2124799728393554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,2,power_law_1.2,1.1524224281311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,2,power_law_1.2,1.154368019104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,32,balanced,0.17756799856821695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,32,balanced,0.1792959968249003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,32,power_law_1.01,0.18673919439315795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,32,power_law_1.01,0.20446720123291015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,32,power_law_1.2,0.1832576036453247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,32,power_law_1.2,0.20858240127563477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,4,balanced,0.8432532946268717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,4,balanced,0.8469866911570231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,4,power_law_1.01,0.7445375919342041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,4,power_law_1.01,0.7978943824768067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,4,power_law_1.2,0.6572288036346435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,4,power_law_1.2,0.724889612197876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,64,balanced,0.11265066266059875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,64,balanced,0.11296533544858296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,64,power_law_1.01,0.11783679723739623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,64,power_law_1.01,0.11790080070495605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,64,power_law_1.2,0.11365760564804077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,64,power_law_1.2,0.11763839721679688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,8,balanced,0.4522560040156047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,8,balanced,0.4551200071970622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,8,power_law_1.01,0.5281792163848877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,8,power_law_1.01,0.579641580581665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,8,power_law_1.2,0.503545618057251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,1,8,power_law_1.2,0.5574207782745362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,16,1,balanced,0.389850656191508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,16,1,balanced,0.4036426544189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,16,1,power_law_1.01,0.2647167921066284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,16,1,power_law_1.01,0.2658047914505005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,16,1,power_law_1.2,0.2474303960800171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,16,1,power_law_1.2,0.24980480670928956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,2,1,balanced,1.6321172714233398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,2,1,balanced,1.6328266461690266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,2,1,power_law_1.01,1.064844799041748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,2,1,power_law_1.01,1.1026944160461425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,2,1,power_law_1.2,0.9576959609985352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,2,1,power_law_1.2,0.9826751708984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,32,1,balanced,0.3298400044441223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,32,1,balanced,0.33007999261220294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,32,1,power_law_1.01,0.21083519458770753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,32,1,power_law_1.01,0.2125312089920044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,32,1,power_law_1.2,0.20312960147857667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,32,1,power_law_1.2,0.2043328046798706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,4,1,balanced,0.9021759827931722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,4,1,balanced,0.9105172952016195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,4,1,power_law_1.01,0.5932672023773193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,4,1,power_law_1.01,0.5987648010253906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,4,1,power_law_1.2,0.545420789718628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,4,1,power_law_1.2,0.5459904193878173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,8,1,balanced,0.5506240129470825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,8,1,balanced,0.5541119972864786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,8,1,power_law_1.01,0.3833600044250488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,8,1,power_law_1.01,0.38416640758514403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,8,1,power_law_1.2,0.3414144039154053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,32,7168,2048,8,384,8,1,power_law_1.2,0.34202880859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,1,balanced,0.27160000801086426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,1,balanced,0.27320533990859985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,1,power_law_1.01,0.25345280170440676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,1,power_law_1.01,0.2548095941543579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,1,power_law_1.2,0.25776000022888185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,1,power_law_1.2,0.25919361114501954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,128,balanced,0.053370664517084755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,128,balanced,0.05401599903901418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,128,power_law_1.01,0.051583999395370485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,128,power_law_1.01,0.05221760272979736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,128,power_law_1.2,0.05381760001182556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,128,power_law_1.2,0.05384960174560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,16,balanced,0.06141333281993866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,16,balanced,0.062319998939832054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,16,power_law_1.01,0.06190720200538635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,16,power_law_1.01,0.06255360245704651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,16,power_law_1.2,0.06330239772796631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,16,power_law_1.2,0.06388480067253113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,2,balanced,0.14176533619562784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,2,balanced,0.14718400438626608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,2,power_law_1.01,0.1384768009185791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,2,power_law_1.01,0.1435647964477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,2,power_law_1.2,0.13978240489959717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,2,power_law_1.2,0.14569599628448487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,32,balanced,0.052154665191968284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,32,balanced,0.05382933219273885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,32,power_law_1.01,0.05273600220680237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,32,power_law_1.01,0.05304319858551025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,32,power_law_1.2,0.052300798892974856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,32,power_law_1.2,0.053600001335144046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,4,balanced,0.09683199723561604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,4,balanced,0.09707199533780415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,4,power_law_1.01,0.09875199794769288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,4,power_law_1.01,0.09878399968147278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,4,power_law_1.2,0.10094720125198364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,4,power_law_1.2,0.10261759757995606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,64,balanced,0.052671998739242554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,64,balanced,0.053861334919929504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,64,power_law_1.01,0.05395200252532959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,64,power_law_1.01,0.05541120171546936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,64,power_law_1.2,0.05477759838104248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,64,power_law_1.2,0.0551360011100769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,8,balanced,0.07417066891988118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,8,balanced,0.0745600014925003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,8,power_law_1.01,0.07323520183563233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,8,power_law_1.01,0.07412480115890503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,8,power_law_1.2,0.0747648000717163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,1,8,power_law_1.2,0.0748095989227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,2,1,balanced,0.13611732920010886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,2,1,balanced,0.13661866386731467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,2,1,power_law_1.01,0.13344639539718628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,2,1,power_law_1.01,0.13392640352249147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,2,1,power_law_1.2,0.1350399971008301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,2,1,power_law_1.2,0.13671040534973145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,4,1,balanced,0.09126399954160054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,4,1,balanced,0.09204799930254619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,4,1,power_law_1.01,0.08899840116500854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,4,1,power_law_1.01,0.09032959938049316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,4,1,power_law_1.2,0.09121919870376587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2048,768,8,128,4,1,power_law_1.2,0.09234560132026673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,1,balanced,0.6070133447647095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,1,balanced,0.6093226671218872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,1,power_law_1.01,0.628607988357544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,1,power_law_1.01,0.6353919982910157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,1,power_law_1.2,0.6459904193878174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,1,power_law_1.2,0.6577727794647217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,128,balanced,0.07256533205509186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,128,balanced,0.07414933542410533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,128,power_law_1.01,0.0729856014251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,128,power_law_1.01,0.07379199862480164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,128,power_law_1.2,0.07428479790687562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,128,power_law_1.2,0.0743615984916687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,16,balanced,0.09266666571299235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,16,balanced,0.09335999687512715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,16,power_law_1.01,0.09190400242805481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,16,power_law_1.01,0.09357439875602722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,16,power_law_1.2,0.09316480159759521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,16,power_law_1.2,0.09663360118865967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,2,balanced,0.3671040137608846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,2,balanced,0.3713173468907674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,2,power_law_1.01,0.34610559940338137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,2,power_law_1.01,0.35779199600219724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,2,power_law_1.2,0.35214719772338865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,2,power_law_1.2,0.3604095935821533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,32,balanced,0.0817386656999588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,32,balanced,0.08338133494059245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,32,power_law_1.01,0.07971839904785157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,32,power_law_1.01,0.08095359802246094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,32,power_law_1.2,0.08155519962310791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,32,power_law_1.2,0.08270080089569092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,4,balanced,0.21730667352676392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,4,balanced,0.21753599246342978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,4,power_law_1.01,0.2081536054611206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,4,power_law_1.01,0.21283841133117676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,4,power_law_1.2,0.20631039142608643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,4,power_law_1.2,0.21181440353393555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,64,balanced,0.07449600100517273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,64,balanced,0.07645866771539052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,64,power_law_1.01,0.07683839797973632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,64,power_law_1.01,0.07742080092430115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,64,power_law_1.2,0.07707520127296448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,64,power_law_1.2,0.07722240090370178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,8,balanced,0.1420693298180898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,8,balanced,0.14250133434931436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,8,power_law_1.01,0.13633279800415038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,8,power_law_1.01,0.14205440282821655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,8,power_law_1.2,0.1390720009803772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,1,8,power_law_1.2,0.1403712034225464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,16,1,balanced,0.22427199284235635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,16,1,balanced,0.225055992603302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,16,1,power_law_1.01,0.21812479496002196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,16,1,power_law_1.01,0.21896960735321044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,16,1,power_law_1.2,0.2255552053451538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,16,1,power_law_1.2,0.22619519233703614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,2,1,balanced,0.3551199833552043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,2,1,balanced,0.3569493293762207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,2,1,power_law_1.01,0.33902080059051515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,2,1,power_law_1.01,0.3407615900039673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,2,1,power_law_1.2,0.34348158836364745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,2,1,power_law_1.2,0.3491647958755493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,32,1,balanced,0.19114667177200317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,32,1,balanced,0.19282132387161255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,32,1,power_law_1.01,0.18880000114440917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,32,1,power_law_1.01,0.19192320108413696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,32,1,power_law_1.2,0.1929919958114624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,32,1,power_law_1.2,0.19404799938201905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,4,1,balanced,0.2100213368733724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,4,1,balanced,0.21042666832605997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,4,1,power_law_1.01,0.20099198818206787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,4,1,power_law_1.01,0.20310399532318116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,4,1,power_law_1.2,0.20465919971466065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,4,1,power_law_1.2,0.20561280250549316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,8,1,balanced,0.3276639978090922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,8,1,balanced,0.3284426728884379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,8,1,power_law_1.01,0.31536641120910647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,8,1,power_law_1.01,0.320032000541687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,8,1,power_law_1.2,0.3255167961120605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,2688,1856,6,128,8,1,power_law_1.2,0.32699520587921144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,1,balanced,1.1891573270161946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,1,balanced,1.1959413687388103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,1,power_law_1.01,1.0110976219177246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,1,power_law_1.01,1.0223936080932616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,1,power_law_1.2,1.0444095611572266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,1,power_law_1.2,1.053593635559082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,128,balanced,0.10917866230010986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,128,balanced,0.10966933767000835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,128,power_law_1.01,0.10753920078277587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,128,power_law_1.01,0.10954240560531617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,128,power_law_1.2,0.11018879413604736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,128,power_law_1.2,0.11263999938964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,16,balanced,0.1684160033861796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,16,balanced,0.16881599028905234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,16,power_law_1.01,0.14678399562835692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,16,power_law_1.01,0.14880000352859496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,16,power_law_1.2,0.16362240314483642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,16,power_law_1.2,0.1664512038230896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,2,balanced,0.6307573318481445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,2,balanced,0.6352159976959229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,2,power_law_1.01,0.5647359848022461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,2,power_law_1.01,0.578611183166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,2,power_law_1.2,0.5821631908416748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,2,power_law_1.2,0.5914624214172364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,256,balanced,0.10726400216420491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,256,balanced,0.10730666915575664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,256,power_law_1.01,0.10533759593963624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,256,power_law_1.01,0.10597120523452759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,256,power_law_1.2,0.10703359842300415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,256,power_law_1.2,0.10737919807434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,32,balanced,0.12355200449625652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,32,balanced,0.12386666735013326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,32,power_law_1.01,0.1192896008491516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,32,power_law_1.01,0.11994880437850952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,32,power_law_1.2,0.12227840423583984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,32,power_law_1.2,0.12310400009155273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,4,balanced,0.3682933251063029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,4,balanced,0.3699093262354533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,4,power_law_1.01,0.34257919788360597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,4,power_law_1.01,0.35066239833831786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,4,power_law_1.2,0.3486272096633911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,4,power_law_1.2,0.3526400089263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,64,balanced,0.11371200283368428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,64,balanced,0.11469866832097371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,64,power_law_1.01,0.11246720552444459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,64,power_law_1.01,0.11273599863052368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,64,power_law_1.2,0.11359360218048095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,64,power_law_1.2,0.11389440298080444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,8,balanced,0.23163733879725137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,8,balanced,0.23283199469248453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,8,power_law_1.01,0.21838080883026123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,8,power_law_1.01,0.21958398818969727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,8,power_law_1.2,0.21772799491882325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,1,8,power_law_1.2,0.22118399143218995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,16,1,balanced,0.16967999935150146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,16,1,balanced,0.17133333285649618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,16,1,power_law_1.01,0.1580288052558899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,16,1,power_law_1.01,0.158297598361969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,16,1,power_law_1.2,0.163481605052948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,16,1,power_law_1.2,0.1637760043144226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,2,1,balanced,0.610912005106608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,2,1,balanced,0.611407995223999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,2,1,power_law_1.01,0.5430016040802002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,2,1,power_law_1.01,0.5474368095397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,2,1,power_law_1.2,0.5495552062988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,2,1,power_law_1.2,0.5604415893554687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,32,1,balanced,0.12713600198427835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,32,1,balanced,0.12757866581281027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,32,1,power_law_1.01,0.12174719572067261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,32,1,power_law_1.01,0.12233599424362182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,32,1,power_law_1.2,0.12195199728012085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,32,1,power_law_1.2,0.12279679775238037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,4,1,balanced,0.3445333242416382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,4,1,balanced,0.3452266852060954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,4,1,power_law_1.01,0.3149183988571167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,4,1,power_law_1.01,0.3215167999267578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,4,1,power_law_1.2,0.32274560928344725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,4,1,power_law_1.2,0.32520959377288816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,8,1,balanced,0.21106666326522827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,8,1,balanced,0.2139093279838562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,8,1,power_law_1.01,0.1963711977005005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,8,1,power_law_1.01,0.19783040285110473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,8,1,power_law_1.2,0.19900159835815429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,3072,1536,8,256,8,1,power_law_1.2,0.2006848096847534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,1,balanced,0.7400906880696615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,1,balanced,0.7424426873524984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,1,power_law_1.01,0.789247989654541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,1,power_law_1.01,0.815129566192627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,1,power_law_1.2,0.794975996017456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,1,power_law_1.2,0.8092800140380859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,2,balanced,0.40745067596435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,2,balanced,0.4086666504542033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,2,power_law_1.01,0.4919424057006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,2,power_law_1.01,0.5107903957366944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,2,power_law_1.2,0.5014400005340576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,2,power_law_1.2,0.5070015907287597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,4,balanced,0.3022986650466919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,4,balanced,0.30594666798909503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,4,power_law_1.01,0.330297589302063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,4,power_law_1.01,0.3359296083450317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,4,power_law_1.2,0.3337791919708252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,4,power_law_1.2,0.34904959201812746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,8,balanced,0.25179733832677204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,8,balanced,0.255237340927124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,8,power_law_1.01,0.279532790184021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,8,power_law_1.01,0.2864511966705322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,8,power_law_1.2,0.28123519420623777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,1,8,power_law_1.2,0.29049599170684814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,16,1,balanced,0.0918239951133728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,16,1,balanced,0.0925546685854594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,16,1,power_law_1.01,0.09141119718551635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,16,1,power_law_1.01,0.09201920032501221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,16,1,power_law_1.2,0.08894079923629761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,16,1,power_law_1.2,0.08922880291938781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,2,1,balanced,0.3920746644337972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,2,1,balanced,0.3935946623484294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,2,1,power_law_1.01,0.38064639568328856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,2,1,power_law_1.01,0.39438719749450685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,2,1,power_law_1.2,0.3835135936737061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,2,1,power_law_1.2,0.3864255905151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,32,1,balanced,0.08056533336639404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,32,1,balanced,0.08111466467380524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,32,1,power_law_1.01,0.07594879865646362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,32,1,power_law_1.01,0.07692800164222717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,32,1,power_law_1.2,0.07647359967231751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,32,1,power_law_1.2,0.07715200185775757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,4,1,balanced,0.2246560057004293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,4,1,balanced,0.22830933332443237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,4,1,power_law_1.01,0.2105855941772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,4,1,power_law_1.01,0.21251199245452881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,4,1,power_law_1.2,0.2030400037765503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,4,1,power_law_1.2,0.20908799171447753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,8,1,balanced,0.1476906637350718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,8,1,balanced,0.1509866714477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,8,1,power_law_1.01,0.11631360054016113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,8,1,power_law_1.01,0.11813759803771973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,8,1,power_law_1.2,0.11963520050048829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,14336,2,8,8,1,power_law_1.2,0.12284799814224243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,1,balanced,0.7943627039591471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,1,balanced,0.796837329864502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,1,power_law_1.01,0.7802688121795655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,1,power_law_1.01,0.8014464378356934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,1,power_law_1.2,0.8005056381225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,1,power_law_1.2,0.8090239524841308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,128,balanced,0.09001066287358601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,128,balanced,0.09232532978057861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,128,power_law_1.01,0.09050880074501037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,128,power_law_1.01,0.09192960262298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,128,power_law_1.2,0.09322879910469055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,128,power_law_1.2,0.09479039907455444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,16,balanced,0.1216373344262441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,16,balanced,0.12304533521334331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,16,power_law_1.01,0.12253439426422119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,16,power_law_1.01,0.12367360591888428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,16,power_law_1.2,0.1273408055305481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,16,power_law_1.2,0.12735359668731688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,2,balanced,0.44415465990702313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,2,balanced,0.4461013476053874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,2,power_law_1.01,0.4393727779388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,2,power_law_1.01,0.4445055961608887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,2,power_law_1.2,0.4514495849609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,2,power_law_1.2,0.4609087944030762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,32,balanced,0.1088746686776479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,32,balanced,0.10916800300280254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,32,power_law_1.01,0.10967040061950684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,32,power_law_1.01,0.10977280139923096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,32,power_law_1.2,0.11132160425186158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,32,power_law_1.2,0.1119871973991394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,4,balanced,0.25893332560857135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,4,balanced,0.2604373296101888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,4,power_law_1.01,0.2585536003112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,4,power_law_1.01,0.2676160097122192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,4,power_law_1.2,0.2724096059799194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,4,power_law_1.2,0.27764480113983153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,64,balanced,0.10356266299883525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,64,balanced,0.10482133428255717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,64,power_law_1.01,0.10478719472885131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,64,power_law_1.01,0.10545920133590699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,64,power_law_1.2,0.10573439598083496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,64,power_law_1.2,0.10618239641189575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,8,balanced,0.17067732413609824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,8,balanced,0.17076265811920166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,8,power_law_1.01,0.18290560245513915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,8,power_law_1.01,0.18789759874343873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,8,power_law_1.2,0.18538880348205566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,1,8,power_law_1.2,0.18994560241699218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,16,1,balanced,0.12702932953834534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,16,1,balanced,0.12801067034403482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,16,1,power_law_1.01,0.12602880001068115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,16,1,power_law_1.01,0.12684799432754518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,16,1,power_law_1.2,0.12754559516906738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,16,1,power_law_1.2,0.12893439531326295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,2,1,balanced,0.5070986747741699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,2,1,balanced,0.509333332379659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,2,1,power_law_1.01,0.4754623889923096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,2,1,power_law_1.01,0.4772480010986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,2,1,power_law_1.2,0.47757439613342284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,2,1,power_law_1.2,0.484281587600708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,32,1,balanced,0.11282133062680562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,32,1,balanced,0.11311466495196025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,32,1,power_law_1.01,0.11184639930725097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,32,1,power_law_1.01,0.11336319446563721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,32,1,power_law_1.2,0.11347839832305909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,4,1,balanced,0.24304533004760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,4,1,balanced,0.24484266837437949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,4,1,power_law_1.01,0.241593599319458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,4,1,power_law_1.01,0.24335999488830568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,4,1,power_law_1.2,0.24282240867614746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,4,1,power_law_1.2,0.24389119148254396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,8,1,balanced,0.1588586668173472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,8,1,balanced,0.16037866473197937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,8,1,power_law_1.01,0.15685759782791137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,8,1,power_law_1.01,0.15783679485321045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,8,1,power_law_1.2,0.15508480072021485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,1536,8,128,8,1,power_law_1.2,0.15954560041427612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,1,balanced,5.471279780069987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,1,balanced,5.501701354980469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,1,power_law_1.01,5.04967041015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,1,power_law_1.01,5.076121520996094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,1,power_law_1.2,5.224319839477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,1,power_law_1.2,5.286073684692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,128,balanced,0.3331413269042969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,128,balanced,0.3345173199971517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,128,power_law_1.01,0.33274240493774415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,128,power_law_1.01,0.340774393081665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,128,power_law_1.2,0.33943679332733157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,128,power_law_1.2,0.3412224054336548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,16,balanced,0.6363253196080526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,16,balanced,0.6364213228225708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,16,power_law_1.01,0.6126527786254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,16,power_law_1.01,0.6146624088287354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,16,power_law_1.2,0.6216320037841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,16,power_law_1.2,0.6289023876190185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,2,balanced,2.9119574228922525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,2,balanced,2.9520107905069985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,2,power_law_1.01,2.6666688919067383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,2,power_law_1.01,2.7130111694335937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,2,power_law_1.2,2.774982452392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,2,power_law_1.2,2.8152639389038088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,256,balanced,0.3283626635869344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,256,balanced,0.33026667435963947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,256,power_law_1.01,0.3307904005050659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,256,power_law_1.01,0.33137919902801516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,256,power_law_1.2,0.3335488080978394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,256,power_law_1.2,0.3338495969772339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,32,balanced,0.46907734870910645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,32,balanced,0.47017598152160645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,32,power_law_1.01,0.45783038139343263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,32,power_law_1.01,0.460422420501709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,32,power_law_1.2,0.4650112152099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,32,power_law_1.2,0.46964478492736816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,4,balanced,1.560197353363037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,4,balanced,1.5711785952250164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,4,power_law_1.01,1.4846719741821288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,4,power_law_1.01,1.4855680465698242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,4,power_law_1.2,1.51278076171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,4,power_law_1.2,1.5129407882690429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,64,balanced,0.36740267276763916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,64,balanced,0.3676160176595052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,64,power_law_1.01,0.37669761180877687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,64,power_law_1.01,0.37776639461517336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,64,power_law_1.2,0.3898112058639526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,64,power_law_1.2,0.3978303909301758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,8,balanced,0.9410293102264404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,8,balanced,0.9413812955220541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,8,power_law_1.01,0.8873984336853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,8,power_law_1.01,0.8910335540771485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,8,power_law_1.2,0.9079744338989257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,1,8,power_law_1.2,0.9328448295593261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,16,1,balanced,1.4768053690592449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,16,1,balanced,1.4797706604003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,16,1,power_law_1.01,1.4047295570373535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,16,1,power_law_1.01,1.4239871978759766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,16,1,power_law_1.2,1.46046724319458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,16,1,power_law_1.2,1.4755647659301758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,2,1,balanced,2.550917307535807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,2,1,balanced,2.5678292910257974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,2,1,power_law_1.01,2.565465545654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,2,1,power_law_1.01,2.5953407287597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,2,1,power_law_1.2,2.611897659301758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,2,1,power_law_1.2,2.696384048461914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,32,1,balanced,1.1712480386098225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,32,1,balanced,1.171445369720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,32,1,power_law_1.01,1.1215935707092286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,32,1,power_law_1.01,1.1294848442077636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,32,1,power_law_1.2,1.176243209838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,32,1,power_law_1.2,1.1820799827575683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,4,1,balanced,1.4642292658487956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,4,1,balanced,1.4646453857421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,4,1,power_law_1.01,1.4931008338928222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,4,1,power_law_1.01,1.499020767211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,4,1,power_law_1.2,1.5411775588989258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,4,1,power_law_1.2,1.5504128456115722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,8,1,balanced,0.8027040163675944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,8,1,balanced,0.8073440392812093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,8,1,power_law_1.01,0.7596928119659424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,8,1,power_law_1.01,0.7633984088897705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,8,1,power_law_1.2,0.7948416233062744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,4096,2688,22,512,8,1,power_law_1.2,0.8036671638488769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,1,balanced,1.3215946356455486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,1,balanced,1.3609174092610676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,1,power_law_1.01,1.213759994506836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,1,power_law_1.01,1.2572799682617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,1,power_law_1.2,1.1869952201843261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,1,power_law_1.2,1.2132736206054688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,2,balanced,0.6784373124440511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,2,balanced,0.6799413363138834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,2,power_law_1.01,0.7582592010498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,2,power_law_1.01,0.7591616153717041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,2,power_law_1.2,0.7764863967895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,2,power_law_1.2,0.8006655693054199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,4,balanced,0.4065279960632324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,4,balanced,0.40884800752003986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,4,power_law_1.01,0.46151041984558105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,4,power_law_1.01,0.4634751796722412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,4,power_law_1.2,0.4634687900543213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,4,power_law_1.2,0.4642176151275635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,8,balanced,0.3228106697400411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,8,balanced,0.3229653239250183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,8,power_law_1.01,0.3543551921844482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,8,power_law_1.01,0.3663167953491211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,8,power_law_1.2,0.37532799243927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,1,8,power_law_1.2,0.3815167903900146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,16,1,balanced,0.11983467141787212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,16,1,balanced,0.12054933110872905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,16,1,power_law_1.01,0.11900160312652588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,16,1,power_law_1.01,0.1202623963356018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,16,1,power_law_1.2,0.11965440511703491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,16,1,power_law_1.2,0.12094080448150635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,2,1,balanced,0.6013546784718832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,2,1,balanced,0.6120479901631674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,2,1,power_law_1.01,0.5945792198181152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,2,1,power_law_1.01,0.5982143878936768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,2,1,power_law_1.2,0.5879615783691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,2,1,power_law_1.2,0.6019008159637451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,32,1,balanced,0.10290666421254475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,32,1,balanced,0.1032480001449585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,32,1,power_law_1.01,0.10160000324249267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,32,1,power_law_1.01,0.10190720558166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,32,1,power_law_1.2,0.10227839946746826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,32,1,power_law_1.2,0.10294400453567505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,4,1,balanced,0.3313279946645101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,4,1,balanced,0.3314239978790283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,4,1,power_law_1.01,0.3182463884353638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,4,1,power_law_1.01,0.3246783971786499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,4,1,power_law_1.2,0.31598079204559326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,4,1,power_law_1.2,0.32524158954620364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,8,1,balanced,0.20170666774113974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,8,1,balanced,0.20563199122746786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,8,1,power_law_1.01,0.1988800048828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,8,1,power_law_1.01,0.19946240186691283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,8,1,power_law_1.2,0.19232640266418458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,16384,2,8,8,1,power_law_1.2,0.20060160160064697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,1,balanced,3.120234807332357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,1,balanced,3.1746721267700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,1,power_law_1.01,2.6764799118041993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,1,power_law_1.01,2.699257659912109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,1,power_law_1.2,2.6921920776367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,1,power_law_1.2,2.7579839706420897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,128,balanced,0.18056533734003702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,128,balanced,0.18129066626230875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,128,power_law_1.01,0.17745920419692993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,128,power_law_1.01,0.17781120538711548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,128,power_law_1.2,0.17590399980545043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,128,power_law_1.2,0.18019200563430787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,16,balanced,0.33869866530100506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,16,balanced,0.3391626675923665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,16,power_law_1.01,0.30906240940093993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,16,power_law_1.01,0.32911360263824463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,16,power_law_1.2,0.32984960079193115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,16,power_law_1.2,0.32997760772705076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,2,balanced,1.6045014063517253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,2,balanced,1.6337439219156902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,2,power_law_1.01,1.371776008605957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,2,power_law_1.01,1.4102144241333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,2,power_law_1.2,1.4215744018554688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,2,power_law_1.2,1.4240832328796387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,256,balanced,0.1730560064315796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,256,balanced,0.1740586757659912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,256,power_law_1.01,0.17185920476913452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,256,power_law_1.01,0.17212159633636476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,256,power_law_1.2,0.17294080257415773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,256,power_law_1.2,0.17349120378494262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,32,balanced,0.22245333592096964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,32,balanced,0.22431999444961548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,32,power_law_1.01,0.2062079906463623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,32,power_law_1.01,0.2126528024673462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,32,power_law_1.2,0.22024319171905518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,32,power_law_1.2,0.2280832052230835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,4,balanced,0.857151985168457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,4,balanced,0.8585120042165121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,4,power_law_1.01,0.8014335632324219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,4,power_law_1.01,0.8205696105957031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,4,power_law_1.2,0.8236607551574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,4,power_law_1.2,0.8239871978759765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,64,balanced,0.18489599227905273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,64,balanced,0.1851253310839335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,64,power_law_1.01,0.18131840229034424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,64,power_law_1.01,0.18186880350112916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,64,power_law_1.2,0.18403840065002441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,64,power_law_1.2,0.18531839847564696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,8,balanced,0.5121226708094279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,8,balanced,0.5126293500264486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,8,power_law_1.01,0.4695744037628174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,8,power_law_1.01,0.490067195892334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,8,power_law_1.2,0.4867072105407715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,1,8,power_law_1.2,0.49120640754699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,16,1,balanced,0.3346506754557292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,16,1,balanced,0.3349119822184245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,16,1,power_law_1.01,0.2820735931396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,16,1,power_law_1.01,0.30842878818511965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,16,1,power_law_1.2,0.3109568119049072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,16,1,power_law_1.2,0.3216192007064819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,2,1,balanced,1.585792064666748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,2,1,balanced,1.5963733990987141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,2,1,power_law_1.01,1.3720447540283203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,2,1,power_law_1.01,1.373689556121826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,2,1,power_law_1.2,1.3818623542785644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,2,1,power_law_1.2,1.4044095993041992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,32,1,balanced,0.23425600926081339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,32,1,balanced,0.23487999041875204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,32,1,power_law_1.01,0.2211008071899414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,32,1,power_law_1.01,0.22163839340209962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,32,1,power_law_1.2,0.2231679916381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,32,1,power_law_1.2,0.22417919635772704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,4,1,balanced,0.8156479994455973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,4,1,balanced,0.8200799624125162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,4,1,power_law_1.01,0.7293824195861817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,4,1,power_law_1.01,0.7411968231201171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,4,1,power_law_1.2,0.7536448001861572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,4,1,power_law_1.2,0.7559487819671631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,8,1,balanced,0.4849280118942261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,8,1,balanced,0.48609598477681476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,8,1,power_law_1.01,0.4386303901672363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,8,1,power_law_1.01,0.4425407886505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,8,1,power_law_1.2,0.44760961532592775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2048,8,256,8,1,power_law_1.2,0.44798078536987307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,1,balanced,2.4328959782918296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,1,balanced,2.455514589945475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,1,power_law_1.01,2.312704086303711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,1,power_law_1.01,2.3190784454345703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,1,power_law_1.2,2.337926483154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,1,power_law_1.2,2.364793586730957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,16,balanced,0.27129600445429486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,16,balanced,0.27313599983851117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,16,power_law_1.01,0.28286080360412597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,16,power_law_1.01,0.2874943971633911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,16,power_law_1.2,0.2792383909225464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,16,power_law_1.2,0.2805311918258667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,2,balanced,1.2717066605885823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,2,balanced,1.2797173659006755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,2,power_law_1.01,1.1776384353637694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,2,power_law_1.01,1.225875186920166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,2,power_law_1.2,1.2160639762878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,2,power_law_1.2,1.232262420654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,32,balanced,0.1788960099220276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,32,balanced,0.1792693336804708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,32,power_law_1.01,0.18021119832992555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,32,power_law_1.01,0.18755199909210205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,32,power_law_1.2,0.1858240008354187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,32,power_law_1.2,0.18642560243606568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,4,balanced,0.6790400346120199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,4,balanced,0.6819519996643066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,4,power_law_1.01,0.6605696201324462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,4,power_law_1.01,0.6768511772155762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,4,power_law_1.2,0.6773248195648194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,4,power_law_1.2,0.7011072158813476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,8,balanced,0.4018079837163289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,8,balanced,0.40220268567403156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,8,power_law_1.01,0.3882047891616821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,8,power_law_1.01,0.38830718994140623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,8,power_law_1.2,0.40661120414733887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,1,8,power_law_1.2,0.41383042335510256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,16,1,balanced,0.2765653332074483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,16,1,balanced,0.2769920031229655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,16,1,power_law_1.01,0.271776008605957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,16,1,power_law_1.01,0.2732223987579346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,16,1,power_law_1.2,0.2739583969116211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,16,1,power_law_1.2,0.2740544080734253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,2,1,balanced,1.2374826272328694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,2,1,balanced,1.2647253672281902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,2,1,power_law_1.01,1.1816831588745118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,2,1,power_law_1.01,1.1949695587158202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,2,1,power_law_1.2,1.183948802947998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,2,1,power_law_1.2,1.18405122756958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,32,1,balanced,0.1954560081164042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,32,1,balanced,0.196015993754069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,32,1,power_law_1.01,0.19230079650878906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,32,1,power_law_1.01,0.1926144003868103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,32,1,power_law_1.2,0.19347200393676758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,32,1,power_law_1.2,0.19500160217285156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,4,1,balanced,0.6506666739781698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,4,1,balanced,0.6572320063908895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,4,1,power_law_1.01,0.6293439865112305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,4,1,power_law_1.01,0.6350783824920654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,4,1,power_law_1.2,0.6271743774414062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,4,1,power_law_1.2,0.641260814666748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,8,1,balanced,0.36722668011983234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,8,1,balanced,0.3680533170700073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,8,1,power_law_1.01,0.35555200576782225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,8,1,power_law_1.01,0.35669760704040526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,8,1,power_law_1.2,0.3635456085205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,6144,2560,8,160,8,1,power_law_1.2,0.3637183904647827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,1,balanced,3.6743253072102866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,1,balanced,3.7146933873494468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,1,power_law_1.01,3.1314239501953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,1,power_law_1.01,3.144723129272461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,1,power_law_1.2,3.2375873565673827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,1,power_law_1.2,3.3023361206054687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,128,balanced,0.20377065738042197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,128,balanced,0.20394132534662882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,128,power_law_1.01,0.20035839080810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,128,power_law_1.01,0.20101120471954345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,128,power_law_1.2,0.20400640964508057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,128,power_law_1.2,0.20526719093322754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,16,balanced,0.4001173178354899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,16,balanced,0.4007306496302287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,16,power_law_1.01,0.3840895891189575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,16,power_law_1.01,0.3906944036483765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,16,power_law_1.2,0.3712383985519409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,16,power_law_1.2,0.3850176095962524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,2,balanced,1.9156427383422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,2,balanced,1.9165226618448894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,2,power_law_1.01,1.615519905090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,2,power_law_1.01,1.6426816940307618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,2,power_law_1.2,1.6771263122558593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,2,power_law_1.2,1.6957120895385742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,256,balanced,0.197269340356191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,256,balanced,0.1991893251736959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,256,power_law_1.01,0.19456640481948853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,256,power_law_1.01,0.19459199905395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,256,power_law_1.2,0.19662079811096192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,256,power_law_1.2,0.19782400131225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,32,balanced,0.26596800486246747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,32,balanced,0.2663840055465698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,32,power_law_1.01,0.24774401187896727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,32,power_law_1.01,0.24778881072998046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,32,power_law_1.2,0.2565056085586548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,32,power_law_1.2,0.2596735954284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,4,balanced,1.0026986598968506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,4,balanced,1.0028053124745686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,4,power_law_1.01,0.9075519561767578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,4,power_law_1.01,0.9240896224975585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,4,power_law_1.2,0.9249088287353515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,4,power_law_1.2,0.9301440238952636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,64,balanced,0.21131734053293863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,64,balanced,0.2119040091832479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,64,power_law_1.01,0.20815999507904054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,64,power_law_1.01,0.2099071979522705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,64,power_law_1.2,0.21105918884277344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,64,power_law_1.2,0.21643519401550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,8,balanced,0.5999626715977987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,8,balanced,0.602133313814799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,8,power_law_1.01,0.5627456188201905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,8,power_law_1.01,0.5702335834503174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,8,power_law_1.2,0.5683135986328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,1,8,power_law_1.2,0.5716608047485352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,16,1,balanced,0.3887519836425781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,16,1,balanced,0.3887626727422078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,16,1,power_law_1.01,0.3502847909927368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,16,1,power_law_1.01,0.36735360622406005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,16,1,power_law_1.2,0.3621567964553833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,16,1,power_law_1.2,0.3747648000717163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,2,1,balanced,1.8619573911031086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,2,1,balanced,1.9458506902058919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,2,1,power_law_1.01,1.6083648681640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,2,1,power_law_1.01,1.6101951599121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,2,1,power_law_1.2,1.6362815856933595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,2,1,power_law_1.2,1.6856128692626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,32,1,balanced,0.269706666469574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,32,1,balanced,0.2707093358039856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,32,1,power_law_1.01,0.2547647953033447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,32,1,power_law_1.01,0.25664639472961426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,32,1,power_law_1.2,0.25742719173431394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,32,1,power_law_1.2,0.2594048023223877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,4,1,balanced,0.9520800113677979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,4,1,balanced,0.9651412963867188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,4,1,power_law_1.01,0.8440320014953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,4,1,power_law_1.01,0.8532480239868164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,4,1,power_law_1.2,0.8848640441894531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,4,1,power_law_1.2,0.9012351989746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,8,1,balanced,0.5681333144505819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,8,1,balanced,0.569482684135437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,8,1,power_law_1.01,0.5167424201965332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,8,1,power_law_1.01,0.5243968009948731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,8,1,power_law_1.2,0.523744010925293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,256,8,1,power_law_1.2,0.540992021560669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,1,balanced,5.503301620483398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,1,balanced,5.605583826700847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,1,power_law_1.01,4.276480102539063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,1,power_law_1.01,4.399660873413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,1,power_law_1.2,4.3784126281738285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,1,power_law_1.2,4.417049789428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,128,balanced,0.2524799903233846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,128,balanced,0.25286932786305744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,128,power_law_1.01,0.2503103971481323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,128,power_law_1.01,0.2508671998977661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,128,power_law_1.2,0.24824960231781007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,128,power_law_1.2,0.24931840896606444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,16,balanced,0.5326559940973917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,16,balanced,0.5352693398793539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,16,power_law_1.01,0.4694528102874756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,16,power_law_1.01,0.4719232082366943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,16,power_law_1.2,0.4930111885070801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,16,power_law_1.2,0.4962495803833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,2,balanced,2.8132108052571616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,2,balanced,2.817514737447103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,2,power_law_1.01,2.3126848220825194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,2,power_law_1.01,2.3232704162597657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,2,power_law_1.2,2.2275455474853514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,2,power_law_1.2,2.2641408920288084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,32,balanced,0.3757813374201457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,32,balanced,0.3758506774902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,32,power_law_1.01,0.35519359111785886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,32,power_law_1.01,0.3604095935821533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,32,power_law_1.2,0.3510591983795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,32,power_law_1.2,0.35466880798339845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,4,balanced,1.470586617787679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,4,balanced,1.4717119534810383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,4,power_law_1.01,1.2263744354248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,4,power_law_1.01,1.2356672286987305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,4,power_law_1.2,1.2607487678527831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,4,power_law_1.2,1.2668864250183105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,64,balanced,0.27845333019892377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,64,balanced,0.27932266394297284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,64,power_law_1.01,0.2677695989608765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,64,power_law_1.01,0.2711296081542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,64,power_law_1.2,0.26993279457092284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,64,power_law_1.2,0.270796799659729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,8,balanced,0.8444320360819498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,8,balanced,0.8521493275960287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,8,power_law_1.01,0.7442368030548095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,8,power_law_1.01,0.7887360095977783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,8,power_law_1.2,0.7483583927154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,1,8,power_law_1.2,0.7507840156555176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,16,1,balanced,0.5033813317616781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,16,1,balanced,0.5049386819203695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,16,1,power_law_1.01,0.4492095947265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,16,1,power_law_1.01,0.4536320209503174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,16,1,power_law_1.2,0.44756479263305665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,16,1,power_law_1.2,0.4522687911987305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,2,1,balanced,2.6775201161702475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,2,1,balanced,2.68067200978597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,2,1,power_law_1.01,2.199065589904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,2,1,power_law_1.01,2.2396032333374025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,2,1,power_law_1.2,2.1969087600708006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,2,1,power_law_1.2,2.2292543411254884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,32,1,balanced,0.3661706844965617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,32,1,balanced,0.3670346736907959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,32,1,power_law_1.01,0.328985595703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,32,1,power_law_1.01,0.33130879402160646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,32,1,power_law_1.2,0.3277440071105957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,32,1,power_law_1.2,0.32845439910888674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,4,1,balanced,1.3835093180338542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,4,1,balanced,1.415887991587321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,4,1,power_law_1.01,1.1550399780273437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,4,1,power_law_1.01,1.1775487899780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,4,1,power_law_1.2,1.1523712158203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,4,1,power_law_1.2,1.1554304122924806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,8,1,balanced,0.7991627057393392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,8,1,balanced,0.8006933530171713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,8,1,power_law_1.01,0.659660816192627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,8,1,power_law_1.01,0.6609087944030761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,8,1,power_law_1.2,0.6646527767181396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,320,7168,2048,8,384,8,1,power_law_1.2,0.6723199844360351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,1,balanced,0.2748426596323649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,1,balanced,0.2751893401145935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,1,power_law_1.01,0.28510079383850095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,1,power_law_1.01,0.2861824035644531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,1,power_law_1.2,0.28750081062316896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,1,power_law_1.2,0.28794240951538086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,128,balanced,0.05640000104904175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,128,balanced,0.057802667220433555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,128,power_law_1.01,0.0574400007724762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,128,power_law_1.01,0.05750399827957153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,128,power_law_1.2,0.056992000341415404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,128,power_law_1.2,0.05806080102920532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,16,balanced,0.06688533226648967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,16,balanced,0.06799466907978058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,16,power_law_1.01,0.06593919992446899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,16,power_law_1.01,0.06792320013046264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,16,power_law_1.2,0.06878719925880432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,16,power_law_1.2,0.06880639791488648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,2,balanced,0.14819199840227762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,2,balanced,0.15177067120869955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,2,power_law_1.01,0.15322240591049194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,2,power_law_1.01,0.15734399557113649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,2,power_law_1.2,0.15358079671859742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,2,power_law_1.2,0.15856000185012817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,32,balanced,0.0568800022204717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,32,balanced,0.057914664347966514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,32,power_law_1.01,0.05738880038261414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,32,power_law_1.01,0.058169597387313844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,32,power_law_1.2,0.059443199634552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,32,power_law_1.2,0.060115200281143186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,4,balanced,0.1011786659558614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,4,balanced,0.10197333494822185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,4,power_law_1.01,0.10371199846267701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,4,power_law_1.01,0.10817919969558716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,4,power_law_1.2,0.10900479555130005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,4,power_law_1.2,0.11016319990158081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,64,balanced,0.05690666536490122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,64,balanced,0.058490668733914696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,64,power_law_1.01,0.05745919942855835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,64,power_law_1.01,0.05944960117340088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,64,power_law_1.2,0.0590399980545044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,64,power_law_1.2,0.05978879928588867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,8,balanced,0.07940266529719035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,8,balanced,0.07961066563924153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,8,power_law_1.01,0.07951359748840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,8,power_law_1.01,0.07985280156135559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,8,power_law_1.2,0.08013439774513245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,1,8,power_law_1.2,0.08125439882278443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,2,1,balanced,0.13928000132242838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,2,1,balanced,0.13974933822949728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,2,1,power_law_1.01,0.1387519955635071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,2,1,power_law_1.01,0.13953280448913574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,2,1,power_law_1.2,0.14623359441757203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,2,1,power_law_1.2,0.15107840299606323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,4,1,balanced,0.09506666660308838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,4,1,balanced,0.09570133686065674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,4,1,power_law_1.01,0.09415680170059204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,4,1,power_law_1.01,0.09464319944381713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,4,1,power_law_1.2,0.10277760028839111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2048,768,8,128,4,1,power_law_1.2,0.10810240507125854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,1,balanced,0.7177866299947103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,1,balanced,0.7315999666849772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,1,power_law_1.01,0.6685567855834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,1,power_law_1.01,0.6725120067596435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,1,power_law_1.2,0.6903744220733643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,1,power_law_1.2,0.6913152217864991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,128,balanced,0.0773226668437322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,128,balanced,0.07824000219504039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,128,power_law_1.01,0.07703040242195129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,128,power_law_1.01,0.07710719704627991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,128,power_law_1.2,0.07788159847259521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,128,power_law_1.2,0.07898880243301391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,16,balanced,0.09637332955996196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,16,balanced,0.09707199533780415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,16,power_law_1.01,0.10057599544525146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,16,power_law_1.01,0.10216959714889526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,16,power_law_1.2,0.10051840543746948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,16,power_law_1.2,0.10149760246276855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,2,balanced,0.3689119815826416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,2,balanced,0.3747733434041341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,2,power_law_1.01,0.35073280334472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,2,power_law_1.01,0.35620479583740233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,2,power_law_1.2,0.36929919719696047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,2,power_law_1.2,0.36948480606079104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,32,balanced,0.08513599634170532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,32,balanced,0.08654933174451192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,32,power_law_1.01,0.08499199748039246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,32,power_law_1.01,0.08569599986076355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,32,power_law_1.2,0.08851199746131896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,32,power_law_1.2,0.08906880021095276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,4,balanced,0.22103466590245566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,4,balanced,0.22160534063975015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,4,power_law_1.01,0.21032960414886476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,4,power_law_1.01,0.21127679347991943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,4,power_law_1.2,0.2197887897491455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,4,power_law_1.2,0.2211519956588745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,64,balanced,0.08029866715272267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,64,balanced,0.0805866668621699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,64,power_law_1.01,0.0830784022808075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,64,power_law_1.01,0.08342400193214417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,64,power_law_1.2,0.08199040293693542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,64,power_law_1.2,0.08289920091629029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,8,balanced,0.14576533436775208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,8,balanced,0.14595199624697366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,8,power_law_1.01,0.14171520471572877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,8,power_law_1.01,0.14379520416259767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,8,power_law_1.2,0.1479871988296509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,1,8,power_law_1.2,0.14928640127182008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,16,1,balanced,0.22611733277638754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,16,1,balanced,0.22633065780003866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,16,1,power_law_1.01,0.22529280185699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,16,1,power_law_1.01,0.22603518962860109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,16,1,power_law_1.2,0.2350719928741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,2,1,balanced,0.3564373254776001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,2,1,balanced,0.35742398103078205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,2,1,power_law_1.01,0.34577279090881347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,2,1,power_law_1.01,0.346777606010437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,2,1,power_law_1.2,0.3474112033843994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,2,1,power_law_1.2,0.34817280769348147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,32,1,balanced,0.1941866676012675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,32,1,balanced,0.19493865966796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,32,1,power_law_1.01,0.19368319511413573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,32,1,power_law_1.01,0.19663360118865966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,32,1,power_law_1.2,0.2005631923675537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,32,1,power_law_1.2,0.20151040554046631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,4,1,balanced,0.21211733420689902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,4,1,balanced,0.21386132637659708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,4,1,power_law_1.01,0.20467839241027833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,4,1,power_law_1.01,0.20611200332641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,4,1,power_law_1.2,0.20892798900604248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,4,1,power_law_1.2,0.2104896068572998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,8,1,balanced,0.3296533425649007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,8,1,balanced,0.33051733175913495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,8,1,power_law_1.01,0.3294015884399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,8,1,power_law_1.01,0.3312896013259888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,8,1,power_law_1.2,0.33406078815460205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,2688,1856,6,128,8,1,power_law_1.2,0.33651840686798096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,1,balanced,1.1658613681793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,1,balanced,1.2047839959462483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,1,power_law_1.01,1.0319295883178712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,1,power_law_1.01,1.0393152236938477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,1,power_law_1.2,1.0608384132385253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,1,power_law_1.2,1.0718208312988282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,128,balanced,0.11333333452542622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,128,balanced,0.11588799953460693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,128,power_law_1.01,0.11403520107269287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,128,power_law_1.01,0.11623680591583252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,128,power_law_1.2,0.11399680376052856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,128,power_law_1.2,0.11649919748306274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,16,balanced,0.17303466796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,16,balanced,0.17384000619252524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,16,power_law_1.01,0.15865600109100342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,16,power_law_1.01,0.1592576026916504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,16,power_law_1.2,0.17229440212249755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,16,power_law_1.2,0.1729920029640198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,2,balanced,0.6358240048090616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,2,balanced,0.641274650891622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,2,power_law_1.01,0.5874048233032226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,2,power_law_1.01,0.593555212020874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,2,power_law_1.2,0.5815680027008057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,2,power_law_1.2,0.594105577468872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,256,balanced,0.11174933115641277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,256,balanced,0.11211733023325603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,256,power_law_1.01,0.11063679456710815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,256,power_law_1.01,0.11110399961471558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,256,power_law_1.2,0.11152640581130982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,256,power_law_1.2,0.1121664047241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,32,balanced,0.12981866796811423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,32,balanced,0.12985600034395853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,32,power_law_1.01,0.1260159969329834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,32,power_law_1.01,0.12840319871902467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,32,power_law_1.2,0.12863999605178833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,32,power_law_1.2,0.12938239574432372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,4,balanced,0.3747680187225342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,4,balanced,0.37603731950124103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,4,power_law_1.01,0.3596863985061646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,4,power_law_1.01,0.36249599456787107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,4,power_law_1.2,0.3483968019485474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,4,power_law_1.2,0.3515903949737549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,64,balanced,0.11918399731318156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,64,balanced,0.11945066849390666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,64,power_law_1.01,0.1182144045829773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,64,power_law_1.01,0.1189568042755127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,64,power_law_1.2,0.11806720495223999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,64,power_law_1.2,0.11950080394744873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,8,balanced,0.23659199476242065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,8,balanced,0.237936000029246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,8,power_law_1.01,0.21882240772247313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,8,power_law_1.01,0.22067840099334718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,8,power_law_1.2,0.22632319927215577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,1,8,power_law_1.2,0.23189120292663573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,16,1,balanced,0.17217600345611572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,16,1,balanced,0.17421332995096842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,16,1,power_law_1.01,0.16001919507980347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,16,1,power_law_1.01,0.16008319854736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,16,1,power_law_1.2,0.166975998878479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,16,1,power_law_1.2,0.16844799518585205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,2,1,balanced,0.6133493185043335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,2,1,balanced,0.614464004834493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,2,1,power_law_1.01,0.5512447834014893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,2,1,power_law_1.01,0.5658751964569092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,2,1,power_law_1.2,0.5678400039672852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,2,1,power_law_1.2,0.5692736148834229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,32,1,balanced,0.12966932853062949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,32,1,balanced,0.13032000263532004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,32,1,power_law_1.01,0.12438399791717529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,32,1,power_law_1.01,0.12503039836883545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,32,1,power_law_1.2,0.12587519884109497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,32,1,power_law_1.2,0.12635519504547119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,4,1,balanced,0.34754133224487305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,4,1,balanced,0.3477226495742798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,4,1,power_law_1.01,0.3216576099395752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,4,1,power_law_1.01,0.3224639892578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,4,1,power_law_1.2,0.3252928018569946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,4,1,power_law_1.2,0.32993919849395753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,8,1,balanced,0.2140586574872335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,8,1,balanced,0.21439466873804727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,8,1,power_law_1.01,0.20203518867492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,8,1,power_law_1.01,0.20339839458465575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,8,1,power_law_1.2,0.20172159671783446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,3072,1536,8,256,8,1,power_law_1.2,0.2031167984008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,1,balanced,0.7518293062845866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,1,balanced,0.753706693649292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,1,power_law_1.01,0.8595968246459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,1,power_law_1.01,0.8680255889892579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,1,power_law_1.2,0.8212991714477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,1,power_law_1.2,0.8637375831604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,2,balanced,0.4152853488922119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,2,balanced,0.41578133900960285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,2,power_law_1.01,0.49886717796325686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,2,power_law_1.01,0.5475584030151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,2,power_law_1.2,0.5169983863830566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,2,power_law_1.2,0.5193791866302491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,4,balanced,0.30738667647043866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,4,balanced,0.3118240038553874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,4,power_law_1.01,0.3784447908401489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,4,power_law_1.01,0.3785919904708862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,4,power_law_1.2,0.3628416061401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,4,power_law_1.2,0.3723135948181152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,8,balanced,0.26183466116587323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,8,balanced,0.2634613315264384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,8,power_law_1.01,0.2930624008178711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,8,power_law_1.01,0.31347200870513914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,8,power_law_1.2,0.3157504081726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,1,8,power_law_1.2,0.3212671995162964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,16,1,balanced,0.09884799520174663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,16,1,balanced,0.09910399715105693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,16,1,power_law_1.01,0.0952127993106842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,16,1,power_law_1.01,0.09539200067520141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,16,1,power_law_1.2,0.09442560076713562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,16,1,power_law_1.2,0.09500160217285156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,2,1,balanced,0.4010239839553833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,2,1,balanced,0.40298668543497723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,2,1,power_law_1.01,0.4166207790374756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,2,1,power_law_1.01,0.4265471935272217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,2,1,power_law_1.2,0.41861758232116697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,2,1,power_law_1.2,0.4325376033782959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,32,1,balanced,0.07788266738255818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,32,1,balanced,0.07853866616884868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,32,1,power_law_1.01,0.08147839903831482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,32,1,power_law_1.01,0.08194559812545776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,32,1,power_law_1.2,0.08072959780693054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,32,1,power_law_1.2,0.08180480003356934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,4,1,balanced,0.23085866371790567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,4,1,balanced,0.2324906587600708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,4,1,power_law_1.01,0.22999680042266846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,4,1,power_law_1.01,0.23420159816741942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,4,1,power_law_1.2,0.22602880001068115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,4,1,power_law_1.2,0.2315648078918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,8,1,balanced,0.15043733517328897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,8,1,balanced,0.15361066659291586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,8,1,power_law_1.01,0.1475711941719055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,8,1,power_law_1.01,0.14929280281066895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,8,1,power_law_1.2,0.14205440282821655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,14336,2,8,8,1,power_law_1.2,0.14777599573135375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,1,balanced,0.7992479801177979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,1,balanced,0.8038079738616943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,1,power_law_1.01,0.8064384460449219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,1,power_law_1.01,0.8087871551513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,1,power_law_1.2,0.8253503799438476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,1,power_law_1.2,0.841766357421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,128,balanced,0.09752000371615092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,128,balanced,0.10079999764760335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,128,power_law_1.01,0.10056320428848267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,128,power_law_1.01,0.10057599544525146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,128,power_law_1.2,0.10061440467834473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,128,power_law_1.2,0.10150400400161744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,16,balanced,0.12771200140317282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,16,balanced,0.128330667813619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,16,power_law_1.01,0.13233920335769653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,16,power_law_1.01,0.1327679991722107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,16,power_law_1.2,0.13327360153198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,16,power_law_1.2,0.13905919790267945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,2,balanced,0.4522879918416341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,2,balanced,0.4543519814809163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,2,power_law_1.01,0.4571648120880127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,2,power_law_1.01,0.4576128005981445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,2,power_law_1.2,0.474502420425415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,2,power_law_1.2,0.4807744026184082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,32,balanced,0.11521066228548686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,32,balanced,0.11525866389274597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,32,power_law_1.01,0.11621760129928589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,32,power_law_1.01,0.11745920181274414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,32,power_law_1.2,0.11764479875564575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,32,power_law_1.2,0.11871999502182007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,4,balanced,0.2663946747779846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,4,balanced,0.2681120038032532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,4,power_law_1.01,0.27733759880065917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,4,power_law_1.01,0.28670079708099366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,4,power_law_1.2,0.29009280204772947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,4,power_law_1.2,0.29395840167999265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,64,balanced,0.1107306679089864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,64,balanced,0.1109226644039154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,64,power_law_1.01,0.110316801071167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,64,power_law_1.01,0.11085439920425415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,64,power_law_1.2,0.11144959926605225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,64,power_law_1.2,0.11222399473190307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,8,balanced,0.17892799774805704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,8,balanced,0.17921600739161173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,8,power_law_1.01,0.19181439876556397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,8,power_law_1.01,0.19500800371170043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,8,power_law_1.2,0.1970304012298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,1,8,power_law_1.2,0.1987328052520752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,16,1,balanced,0.13049599528312683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,16,1,balanced,0.13119999567667642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,16,1,power_law_1.01,0.1317247986793518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,16,1,power_law_1.01,0.133024001121521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,16,1,power_law_1.2,0.13388799428939818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,16,1,power_law_1.2,0.13495680093765258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,2,1,balanced,0.5125866731007894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,2,1,balanced,0.5147466659545898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,2,1,power_law_1.01,0.5280064105987549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,2,1,power_law_1.01,0.5321407794952393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,2,1,power_law_1.2,0.5315519809722901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,2,1,power_law_1.2,0.5341184139251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,32,1,balanced,0.11729066570599873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,32,1,balanced,0.11753066380818684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,32,1,power_law_1.01,0.1168768048286438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,32,1,power_law_1.01,0.11762559413909912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,32,1,power_law_1.2,0.11824640035629272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,32,1,power_law_1.2,0.1184000015258789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,4,1,balanced,0.24859732389450073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,4,1,balanced,0.24929600954055786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,4,1,power_law_1.01,0.24827520847320556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,4,1,power_law_1.01,0.2532351970672607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,4,1,power_law_1.2,0.2715456008911133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,4,1,power_law_1.2,0.27489919662475587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,8,1,balanced,0.1643893321355184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,8,1,balanced,0.16497066617012024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,8,1,power_law_1.01,0.1613759994506836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,8,1,power_law_1.01,0.16455039978027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,8,1,power_law_1.2,0.1796223998069763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,1536,8,128,8,1,power_law_1.2,0.18328959941864015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,1,balanced,5.5594024658203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,1,balanced,5.593589146931966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,1,power_law_1.01,5.299238586425782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,1,power_law_1.01,5.327110290527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,1,power_law_1.2,5.405395126342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,1,power_law_1.2,5.459411239624023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,128,balanced,0.3575626611709595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,128,balanced,0.35869332154591876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,128,power_law_1.01,0.3665472030639648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,128,power_law_1.01,0.36720640659332277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,128,power_law_1.2,0.37322239875793456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,128,power_law_1.2,0.37361280918121337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,16,balanced,0.6622346639633179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,16,balanced,0.6623946825663248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,16,power_law_1.01,0.6411839962005615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,16,power_law_1.01,0.6478591918945312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,16,power_law_1.2,0.6498112201690673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,16,power_law_1.2,0.6525951862335205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,2,balanced,2.978848139444987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,2,balanced,3.007061322530111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,2,power_law_1.01,2.741939163208008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,2,power_law_1.01,2.7648128509521483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,2,power_law_1.2,2.8275007247924804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,2,power_law_1.2,2.874630355834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,256,balanced,0.35386133193969727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,256,balanced,0.35465065638224286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,256,power_law_1.01,0.3587392091751099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,256,power_law_1.01,0.3597759962081909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,256,power_law_1.2,0.3624191999435425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,256,power_law_1.2,0.36250240802764894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,32,balanced,0.493834654490153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,32,balanced,0.49619734287261963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,32,power_law_1.01,0.49488000869750975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,32,power_law_1.01,0.4954368114471436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,32,power_law_1.2,0.5006783962249756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,32,power_law_1.2,0.5034560203552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,4,balanced,1.5875360171000164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,4,balanced,1.6086452802022297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,4,power_law_1.01,1.5117183685302735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,4,power_law_1.01,1.5247936248779297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,4,power_law_1.2,1.4833984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,4,power_law_1.2,1.4870911598205567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,64,balanced,0.3917119900385539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,64,balanced,0.39228800932566327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,64,power_law_1.01,0.40483841896057127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,64,power_law_1.01,0.41558399200439455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,64,power_law_1.2,0.4244991779327393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,64,power_law_1.2,0.4279359817504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,8,balanced,0.9669439792633057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,8,balanced,0.9696586926778158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,8,power_law_1.01,0.9301631927490235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,8,power_law_1.01,0.9470399856567383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,8,power_law_1.2,0.9615551948547363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,1,8,power_law_1.2,0.9665151596069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,16,1,balanced,1.4884319305419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,16,1,balanced,1.4938294092814128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,16,1,power_law_1.01,1.4637311935424804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,16,1,power_law_1.01,1.4763008117675782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,16,1,power_law_1.2,1.511558437347412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,16,1,power_law_1.2,1.5331392288208008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,2,1,balanced,2.7908798853556314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,2,1,balanced,2.805514653523763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,2,1,power_law_1.01,2.7529407501220704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,2,1,power_law_1.01,2.8121664047241213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,2,1,power_law_1.2,2.788326454162598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,2,1,power_law_1.2,2.8072383880615233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,32,1,balanced,1.1845280329386394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,32,1,balanced,1.1850026448567708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,32,1,power_law_1.01,1.1671999931335448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,32,1,power_law_1.01,1.1712960243225097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,32,1,power_law_1.2,1.2202112197875976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,32,1,power_law_1.2,1.2266752243041992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,4,1,balanced,1.6011892954508464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,4,1,balanced,1.6131466229756672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,4,1,power_law_1.01,1.6024703979492188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,4,1,power_law_1.01,1.6207872390747071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,4,1,power_law_1.2,1.6472511291503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,4,1,power_law_1.2,1.658131217956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,8,1,balanced,0.8167306582132975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,8,1,balanced,0.8202826976776123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,8,1,power_law_1.01,0.7908991813659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,8,1,power_law_1.01,0.792844820022583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,8,1,power_law_1.2,0.8255104064941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,4096,2688,22,512,8,1,power_law_1.2,0.8268735885620118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,1,balanced,1.3264799912770588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,1,balanced,1.3541760444641113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,1,power_law_1.01,1.3631296157836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,1,power_law_1.01,1.3766271591186523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,1,power_law_1.2,1.3300160408020019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,1,power_law_1.2,1.3507264137268067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,2,balanced,0.6885706583658854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,2,balanced,0.6932960351308187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,2,power_law_1.01,0.8658816337585449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,2,power_law_1.01,0.8741567611694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,2,power_law_1.2,0.8367744445800781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,2,power_law_1.2,0.927455997467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,4,balanced,0.41228799025217694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,4,balanced,0.41706665356953937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,4,power_law_1.01,0.48226561546325686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,4,power_law_1.01,0.5011583805084229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,4,power_law_1.2,0.48346881866455077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,4,power_law_1.2,0.5130368232727051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,8,balanced,0.3306453426678975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,8,balanced,0.331989328066508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,8,power_law_1.01,0.40191359519958497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,8,power_law_1.01,0.4019711971282959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,8,power_law_1.2,0.40584959983825686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,1,8,power_law_1.2,0.41170558929443357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,16,1,balanced,0.12392533818880717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,16,1,balanced,0.1256480018297831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,16,1,power_law_1.01,0.12343679666519165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,16,1,power_law_1.01,0.12352639436721802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,16,1,power_law_1.2,0.12382719516754151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,16,1,power_law_1.2,0.12440320253372192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,2,1,balanced,0.6080480019251505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,2,1,balanced,0.6224319934844971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,2,1,power_law_1.01,0.6448512077331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,2,1,power_law_1.01,0.6451072216033935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,2,1,power_law_1.2,0.6302271842956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,2,1,power_law_1.2,0.6407551765441895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,32,1,balanced,0.10874666770299275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,32,1,balanced,0.10898666580518086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,32,1,power_law_1.01,0.10600320100784302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,32,1,power_law_1.01,0.10643199682235718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,32,1,power_law_1.2,0.10588159561157226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,32,1,power_law_1.2,0.1068608045578003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,4,1,balanced,0.33585600058237713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,4,1,balanced,0.33659199873606366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,4,1,power_law_1.01,0.3365823984146118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,4,1,power_law_1.01,0.3393280029296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,4,1,power_law_1.2,0.3314111948013306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,4,1,power_law_1.2,0.3385535955429077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,8,1,balanced,0.20625066757202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,8,1,balanced,0.20933334032694498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,8,1,power_law_1.01,0.20709118843078614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,8,1,power_law_1.01,0.2073215961456299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,8,1,power_law_1.2,0.20441598892211915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,16384,2,8,8,1,power_law_1.2,0.20458879470825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,1,balanced,3.1508426666259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,1,balanced,3.2290932337443032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,1,power_law_1.01,2.764409637451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,1,power_law_1.01,2.793094444274902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,1,power_law_1.2,2.8254079818725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,1,power_law_1.2,2.8449792861938477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,128,balanced,0.1867520014444987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,128,balanced,0.18689066171646118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,128,power_law_1.01,0.1851263999938965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,128,power_law_1.01,0.18585599660873414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,128,power_law_1.2,0.18738559484481812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,128,power_law_1.2,0.18819199800491332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,16,balanced,0.3482079903284709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,16,balanced,0.3491520086924235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,16,power_law_1.01,0.33746559619903566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,16,power_law_1.01,0.34168319702148436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,16,power_law_1.2,0.3334208011627197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,16,power_law_1.2,0.339737606048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,2,balanced,1.6302026112874348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,2,balanced,1.6566720008850098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,2,power_law_1.01,1.4141568183898925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,2,power_law_1.01,1.4407999992370606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,2,power_law_1.2,1.4528127670288087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,2,power_law_1.2,1.4940223693847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,256,balanced,0.18056533734003702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,256,balanced,0.1813973387082418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,256,power_law_1.01,0.1810495972633362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,256,power_law_1.01,0.18172800540924072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,256,power_law_1.2,0.18112000226974487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,256,power_law_1.2,0.18220160007476807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,32,balanced,0.23226666450500488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,32,balanced,0.23305600881576538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,32,power_law_1.01,0.22570879459381105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,32,power_law_1.01,0.2335871934890747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,32,power_law_1.2,0.24411520957946778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,32,power_law_1.2,0.2481920003890991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,4,balanced,0.8683679898579916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,4,balanced,0.869429349899292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,4,power_law_1.01,0.816864013671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,4,power_law_1.01,0.8249471664428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,4,power_law_1.2,0.7876031875610352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,4,power_law_1.2,0.8273152351379395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,64,balanced,0.1917333404223124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,64,balanced,0.19592533508936563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,64,power_law_1.01,0.19278719425201415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,64,power_law_1.01,0.1935744047164917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,64,power_law_1.2,0.1955135941505432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,64,power_law_1.2,0.198361599445343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,8,balanced,0.5211093425750732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,8,balanced,0.5219946702321371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,8,power_law_1.01,0.48820481300354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,8,power_law_1.01,0.5101823806762695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,8,power_law_1.2,0.4955904006958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,1,8,power_law_1.2,0.4956223964691162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,16,1,balanced,0.34035201867421466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,16,1,balanced,0.3413120110829671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,16,1,power_law_1.01,0.3066112041473389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,16,1,power_law_1.01,0.31493120193481444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,16,1,power_law_1.2,0.32792959213256834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,16,1,power_law_1.2,0.32803199291229246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,2,1,balanced,1.608565330505371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,2,1,balanced,1.6097280184427898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,2,1,power_law_1.01,1.4131967544555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,2,1,power_law_1.01,1.415174388885498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,2,1,power_law_1.2,1.436076831817627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,2,1,power_law_1.2,1.4415231704711915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,32,1,balanced,0.2396906614303589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,32,1,balanced,0.24087466796239218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,32,1,power_law_1.01,0.22736639976501466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,32,1,power_law_1.01,0.2275775909423828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,32,1,power_law_1.2,0.23219199180603028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,32,1,power_law_1.2,0.23281919956207275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,4,1,balanced,0.8221866289774576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,4,1,balanced,0.8265226682027181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,4,1,power_law_1.01,0.7498239994049072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,4,1,power_law_1.01,0.7567039966583252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,4,1,power_law_1.2,0.7733312129974366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,4,1,power_law_1.2,0.7826560020446778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,8,1,balanced,0.49077868461608887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,8,1,balanced,0.4921226501464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,8,1,power_law_1.01,0.45613441467285154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,8,1,power_law_1.01,0.4646656036376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,8,1,power_law_1.2,0.4692863941192627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2048,8,256,8,1,power_law_1.2,0.47175040245056155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,1,balanced,2.481104056040446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,1,balanced,2.498666604359945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,1,power_law_1.01,2.402668762207031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,1,power_law_1.01,2.4177215576171873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,1,power_law_1.2,2.3929727554321287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,1,power_law_1.2,2.4026880264282227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,16,balanced,0.2842186689376831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,16,balanced,0.28442132472991943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,16,power_law_1.01,0.2953792095184326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,16,power_law_1.01,0.2965183973312378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,16,power_law_1.2,0.28307840824127195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,16,power_law_1.2,0.28928000926971437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,2,balanced,1.2676160335540771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,2,balanced,1.292629321416219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,2,power_law_1.01,1.2588671684265136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,2,power_law_1.01,1.2647232055664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,2,power_law_1.2,1.2514240264892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,2,power_law_1.2,1.2974528312683105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,32,balanced,0.18685867389043173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,32,balanced,0.18706132968266806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,32,power_law_1.01,0.1926911950111389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,32,power_law_1.01,0.19742079973220825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,32,power_law_1.2,0.20962560176849365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,32,power_law_1.2,0.21758720874786378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,4,balanced,0.6904426415761312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,4,balanced,0.6912586688995361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,4,power_law_1.01,0.6944255828857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,4,power_law_1.01,0.7105472087860107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,4,power_law_1.2,0.7176896095275879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,4,power_law_1.2,0.7327295780181885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,8,balanced,0.4137973388036092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,8,balanced,0.4149973392486572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,8,power_law_1.01,0.421235179901123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,8,power_law_1.01,0.43930878639221194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,8,power_law_1.2,0.4313471794128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,1,8,power_law_1.2,0.4402815818786621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,16,1,balanced,0.2813919981320699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,16,1,balanced,0.2816266616185506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,16,1,power_law_1.01,0.27971839904785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,16,1,power_law_1.01,0.28042240142822267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,16,1,power_law_1.2,0.27999999523162844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,16,1,power_law_1.2,0.28171520233154296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,2,1,balanced,1.2645760377248128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,2,1,balanced,1.2785066763559978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,2,1,power_law_1.01,1.1956159591674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,2,1,power_law_1.01,1.220032024383545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,2,1,power_law_1.2,1.2032768249511718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,2,1,power_law_1.2,1.2334527969360352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,32,1,balanced,0.20021865765253702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,32,1,balanced,0.20042665799458823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,32,1,power_law_1.01,0.20013439655303955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,32,1,power_law_1.01,0.20093441009521484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,32,1,power_law_1.2,0.2020672082901001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,32,1,power_law_1.2,0.20246400833129882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,4,1,balanced,0.6594346761703491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,4,1,balanced,0.6654933293660482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,4,1,power_law_1.01,0.639577579498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,4,1,power_law_1.01,0.642086410522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,4,1,power_law_1.2,0.6466047763824463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,4,1,power_law_1.2,0.661843204498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,8,1,balanced,0.373418649037679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,8,1,power_law_1.01,0.36542720794677735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,8,1,power_law_1.01,0.3696000099182129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,8,1,power_law_1.2,0.3829632043838501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,6144,2560,8,160,8,1,power_law_1.2,0.3897408008575439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,1,balanced,3.68120543162028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,1,balanced,3.728368123372396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,1,power_law_1.01,3.2118656158447267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,1,power_law_1.01,3.2122943878173826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,1,power_law_1.2,3.3219070434570312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,1,power_law_1.2,3.3966079711914063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,128,balanced,0.20987733205159506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,128,balanced,0.2102666695912679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,128,power_law_1.01,0.20940160751342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,128,power_law_1.01,0.21125121116638185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,128,power_law_1.2,0.21225600242614745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,128,power_law_1.2,0.2150144100189209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,16,balanced,0.4091840187708537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,16,balanced,0.4110986789067586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,16,power_law_1.01,0.3959872007369995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,16,power_law_1.01,0.39601280689239504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,16,power_law_1.2,0.377292799949646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,16,power_law_1.2,0.38877439498901367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,2,balanced,1.935856024424235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,2,balanced,1.9373653729756672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,2,power_law_1.01,1.6577280044555665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,2,power_law_1.01,1.703251266479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,2,power_law_1.2,1.7427007675170898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,2,power_law_1.2,1.7534912109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,256,balanced,0.2055093248685201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,256,balanced,0.20785599946975708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,256,power_law_1.01,0.20453119277954102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,256,power_law_1.01,0.204966402053833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,256,power_law_1.2,0.20414719581604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,256,power_law_1.2,0.20527999401092528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,32,balanced,0.27534399429957074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,32,balanced,0.27560534079869586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,32,power_law_1.01,0.2670975923538208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,32,power_law_1.01,0.2674623966217041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,32,power_law_1.2,0.2712831974029541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,32,power_law_1.2,0.27692160606384275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,4,balanced,1.0103413263956706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,4,balanced,1.0111680030822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,4,power_law_1.01,0.9265600204467773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,4,power_law_1.01,0.9614784240722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,4,power_law_1.2,0.9477952003479004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,4,power_law_1.2,0.9556351661682129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,64,balanced,0.2202720046043396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,64,balanced,0.22071999311447144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,64,power_law_1.01,0.22095999717712403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,64,power_law_1.01,0.22373759746551514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,64,power_law_1.2,0.22243199348449708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,64,power_law_1.2,0.22260479927062987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,8,balanced,0.6074986855189005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,8,balanced,0.6110080083211263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,8,power_law_1.01,0.5365759849548339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,8,power_law_1.01,0.5696767807006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,8,power_law_1.2,0.5683712005615235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,1,8,power_law_1.2,0.5849408149719239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,16,1,balanced,0.3940800031026204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,16,1,balanced,0.3946293195088704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,16,1,power_law_1.01,0.3641599893569946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,16,1,power_law_1.01,0.36521599292755125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,16,1,power_law_1.2,0.37423999309539796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,16,1,power_law_1.2,0.38108799457550047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,2,1,balanced,1.862287998199463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,2,1,balanced,1.9233652750651042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,2,1,power_law_1.01,1.6371328353881835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,2,1,power_law_1.01,1.6635839462280273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,2,1,power_law_1.2,1.697555160522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,2,1,power_law_1.2,1.7161855697631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,32,1,balanced,0.2738986611366272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,32,1,balanced,0.2760106722513835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,32,1,power_law_1.01,0.26379520893096925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,32,1,power_law_1.01,0.2641792058944702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,32,1,power_law_1.2,0.26645760536193847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,32,1,power_law_1.2,0.26716160774230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,4,1,balanced,0.956010659535726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,4,1,balanced,0.9728586673736572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,4,1,power_law_1.01,0.8863167762756348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,4,1,power_law_1.01,0.8948479652404785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,4,1,power_law_1.2,0.8958911895751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,4,1,power_law_1.2,0.9024448394775391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,8,1,balanced,0.5743093490600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,8,1,balanced,0.5750826597213745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,8,1,power_law_1.01,0.5302207946777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,8,1,power_law_1.01,0.5398335933685303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,8,1,power_law_1.2,0.5422719955444336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,256,8,1,power_law_1.2,0.5458559989929199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,1,balanced,5.546362559000651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,1,balanced,5.5708052317301435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,1,power_law_1.01,4.470924758911133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,1,power_law_1.01,4.482432174682617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,1,power_law_1.2,4.527129745483398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,1,power_law_1.2,4.545830535888672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,128,balanced,0.2625066637992859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,128,balanced,0.2635306715965271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,128,power_law_1.01,0.25919361114501954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,128,power_law_1.01,0.26007680892944335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,128,power_law_1.2,0.25897600650787356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,128,power_law_1.2,0.26060800552368163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,16,balanced,0.5439786513646444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,16,balanced,0.5483946800231934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,16,power_law_1.01,0.4880767822265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,16,power_law_1.01,0.49018239974975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,16,power_law_1.2,0.5023871898651123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,16,power_law_1.2,0.5114048004150391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,2,balanced,2.8213494618733725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,2,balanced,2.84006404876709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,2,power_law_1.01,2.314054489135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,2,power_law_1.01,2.352479934692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,2,power_law_1.2,2.361209678649902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,2,power_law_1.2,2.386515235900879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,32,balanced,0.3853333393732707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,32,balanced,0.3878399928410848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,32,power_law_1.01,0.3533375978469849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,32,power_law_1.01,0.35920000076293945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,32,power_law_1.2,0.3514688014984131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,32,power_law_1.2,0.3748863935470581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,4,balanced,1.4817546208699544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,4,balanced,1.4840480486551921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,4,power_law_1.01,1.255014419555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,4,power_law_1.01,1.2646656036376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,4,power_law_1.2,1.2187456130981444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,4,power_law_1.2,1.2293888092041017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,64,balanced,0.2882026632626851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,64,balanced,0.2890506585439046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,64,power_law_1.01,0.28062078952789304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,64,power_law_1.01,0.2854399919509888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,64,power_law_1.2,0.28555519580841066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,64,power_law_1.2,0.2890624046325684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,8,balanced,0.8560053507486979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,8,balanced,0.8622720241546631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,8,power_law_1.01,0.7483967781066895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,8,power_law_1.01,0.7904128074645996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,8,power_law_1.2,0.7455039978027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,1,8,power_law_1.2,0.746227216720581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,16,1,balanced,0.5090293486913046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,16,1,balanced,0.5117119948069254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,16,1,power_law_1.01,0.4611519813537598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,16,1,power_law_1.01,0.4639296054840088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,16,1,power_law_1.2,0.45800957679748533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,16,1,power_law_1.2,0.46236162185668944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,2,1,balanced,2.6966028213500977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,2,1,balanced,2.7343521118164062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,2,1,power_law_1.01,2.2678592681884764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,2,1,power_law_1.01,2.2770431518554686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,2,1,power_law_1.2,2.283807945251465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,2,1,power_law_1.2,2.319808006286621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,32,1,balanced,0.37138132254282635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,32,1,balanced,0.37167465686798096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,32,1,power_law_1.01,0.3362623929977417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,32,1,power_law_1.01,0.338483190536499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,32,1,power_law_1.2,0.33666560649871824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,32,1,power_law_1.2,0.34031999111175537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,4,1,balanced,1.393664042154948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,4,1,balanced,1.4392639795939128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,4,1,power_law_1.01,1.19551362991333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,4,1,power_law_1.01,1.199014377593994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,4,1,power_law_1.2,1.1712703704833984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,4,1,power_law_1.2,1.1957951545715333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,8,1,balanced,0.8055360317230225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,8,1,balanced,0.8060746987660726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,8,1,power_law_1.01,0.6776383876800537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,8,1,power_law_1.01,0.6833920001983642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,8,1,power_law_1.2,0.6736959934234619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,384,7168,2048,8,384,8,1,power_law_1.2,0.6796607971191406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,1,balanced,0.06545599798361461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,1,balanced,0.0656160016854604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,1,power_law_1.01,0.06390399932861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,1,power_law_1.01,0.06435840129852295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,1,power_law_1.2,0.05944960117340088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,1,power_law_1.2,0.062028801441192626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,128,balanced,0.027376001079877216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,128,balanced,0.029365333418051403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,128,power_law_1.01,0.026694399118423463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,128,power_law_1.01,0.027244800329208375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,128,power_law_1.2,0.026233598589897156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,128,power_law_1.2,0.027820798754692077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,16,balanced,0.029333333174387615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,16,balanced,0.029477333029111225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,16,power_law_1.01,0.03245440125465393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,16,power_law_1.01,0.03275519907474518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,16,power_law_1.2,0.033139199018478394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,16,power_law_1.2,0.033318400382995605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,2,balanced,0.05317866802215576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,2,balanced,0.05651199817657471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,2,power_law_1.01,0.06303359866142273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,2,power_law_1.01,0.06417279839515685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,2,power_law_1.2,0.053401601314544675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,2,power_law_1.2,0.05777919888496399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,32,balanced,0.027322667340437572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,32,balanced,0.029461334149042766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,32,power_law_1.01,0.028486400842666626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,32,power_law_1.01,0.028780800104141236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,32,power_law_1.2,0.027590399980545043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,32,power_law_1.2,0.02842240035533905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,4,balanced,0.03522666543722153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,4,balanced,0.03702933341264725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,4,power_law_1.01,0.04056960046291351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,4,power_law_1.01,0.05578240156173706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,4,power_law_1.2,0.04748800098896026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,4,power_law_1.2,0.048332801461219786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,64,balanced,0.02749866743882497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,64,balanced,0.02914133419593175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,64,power_law_1.01,0.026931199431419372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,64,power_law_1.01,0.02715519964694977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,64,power_law_1.2,0.02698880136013031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,64,power_law_1.2,0.027212798595428467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,8,balanced,0.02943466603755951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,8,balanced,0.029882666965325672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,8,power_law_1.01,0.041536000370979306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,8,power_law_1.01,0.04407039880752563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,8,power_law_1.2,0.03966720104217529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,1,8,power_law_1.2,0.04090240001678467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,2,1,balanced,0.04682666560014089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,2,1,balanced,0.047093331813812256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,2,1,power_law_1.01,0.04477440118789673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,2,1,power_law_1.01,0.04639999866485596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,2,1,power_law_1.2,0.042131200432777405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,2,1,power_law_1.2,0.04353919923305512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,4,1,balanced,0.03538133452335993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,4,1,balanced,0.03541333228349686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,4,1,power_law_1.01,0.034246399998664856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,4,1,power_law_1.01,0.03466239869594574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,4,1,power_law_1.2,0.03452160060405731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2048,768,8,128,4,1,power_law_1.2,0.03452799916267395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,1,balanced,0.13823466499646506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,1,balanced,0.13920533657073975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,1,power_law_1.01,0.13804160356521605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,1,power_law_1.01,0.13818880319595336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,1,power_law_1.2,0.13642879724502563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,1,power_law_1.2,0.13719680309295654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,128,balanced,0.033333333830038704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,128,balanced,0.033573334415753685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,128,power_law_1.01,0.031167998909950256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,128,power_law_1.01,0.03178240060806274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,128,power_law_1.2,0.03159680068492889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,128,power_law_1.2,0.03184640109539032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,16,balanced,0.03741333385308584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,16,balanced,0.03847466657559077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,16,power_law_1.01,0.06046079993247986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,16,power_law_1.01,0.06155520081520081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,16,power_law_1.2,0.061561602354049685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,16,power_law_1.2,0.06673920154571533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,2,balanced,0.09044266740481059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,2,balanced,0.09120532870292664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,2,power_law_1.01,0.10513919591903687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,2,power_law_1.01,0.10747519731521607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,2,power_law_1.2,0.1063040018081665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,2,power_law_1.2,0.11293439865112305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,32,balanced,0.03329066683848699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,32,balanced,0.033344000577926636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,32,power_law_1.01,0.0459199994802475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,32,power_law_1.01,0.046598398685455324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,32,power_law_1.2,0.04657920002937317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,32,power_law_1.2,0.04757120013237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,4,balanced,0.05718400080998739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,4,balanced,0.05815466741720835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,4,power_law_1.01,0.08379520177841186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,4,power_law_1.01,0.08822399973869324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,4,power_law_1.2,0.08394240140914917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,4,power_law_1.2,0.0883840024471283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,64,balanced,0.0329120010137558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,64,balanced,0.03356799980004629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,64,power_law_1.01,0.03540480136871338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,64,power_law_1.01,0.0357120007276535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,64,power_law_1.2,0.035724800825119016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,64,power_law_1.2,0.036620798707008365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,8,balanced,0.04142399877309799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,8,balanced,0.04164800047874451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,8,power_law_1.01,0.0670144021511078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,8,power_law_1.01,0.08008319735527039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,8,power_law_1.2,0.07901440262794494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,1,8,power_law_1.2,0.081632000207901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,16,1,balanced,0.047882666190465294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,16,1,balanced,0.04805333415667216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,16,1,power_law_1.01,0.050361597537994386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,16,1,power_law_1.01,0.051020801067352295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,16,1,power_law_1.2,0.05245440006256104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,16,1,power_law_1.2,0.05261440277099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,2,1,balanced,0.08224000036716461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,2,1,balanced,0.0844586690266927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,2,1,power_law_1.01,0.08122239708900451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,2,1,power_law_1.01,0.08150399923324585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,2,1,power_law_1.2,0.08186879754066467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,2,1,power_law_1.2,0.08212479948997498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,32,1,balanced,0.04780266682306925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,32,1,balanced,0.047968000173568726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,32,1,power_law_1.01,0.04721280038356781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,32,1,power_law_1.01,0.04809600114822388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,32,1,power_law_1.2,0.04734080135822296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,32,1,power_law_1.2,0.04741120040416717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,4,1,balanced,0.05427733560403188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,4,1,balanced,0.05442133545875549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,4,1,power_law_1.01,0.052198398113250735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,4,1,power_law_1.01,0.05237759947776795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,4,1,power_law_1.2,0.05184000134468079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,4,1,power_law_1.2,0.052767997980117796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,8,1,balanced,0.06425066788991292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,8,1,balanced,0.06635733445485432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,8,1,power_law_1.01,0.06743680238723755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,8,1,power_law_1.01,0.06805760264396668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,8,1,power_law_1.2,0.0671999990940094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,2688,1856,6,128,8,1,power_law_1.2,0.06762880086898804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,1,balanced,0.16196266810099283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,1,balanced,0.16455466548601785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,1,power_law_1.01,0.15918079614639283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,1,power_law_1.01,0.16163840293884277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,1,power_law_1.2,0.1603327989578247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,1,power_law_1.2,0.16654720306396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,128,balanced,0.03319466610749563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,128,balanced,0.03323200096686681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,128,power_law_1.01,0.032128000259399415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,128,power_law_1.01,0.0321727991104126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,128,power_law_1.2,0.031999999284744264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,128,power_law_1.2,0.032307198643684386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,16,balanced,0.03346666693687439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,16,balanced,0.03366400053103765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,16,power_law_1.01,0.09494400024414062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,16,power_law_1.01,0.09524480104446412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,16,power_law_1.2,0.0843455970287323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,16,power_law_1.2,0.09325439929962158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,2,balanced,0.09682133793830872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,2,balanced,0.09731200337409973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,2,power_law_1.01,0.132697594165802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,2,power_law_1.01,0.13441920280456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,2,power_law_1.2,0.12878079414367677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,2,power_law_1.2,0.1308608055114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,256,balanced,0.03329066683848699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,256,balanced,0.03349333256483078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,256,power_law_1.01,0.03142400085926056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,256,power_law_1.01,0.03160960078239441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,256,power_law_1.2,0.03113600015640259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,256,power_law_1.2,0.031718400120735166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,32,balanced,0.03362133353948593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,32,balanced,0.03368533402681351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,32,power_law_1.01,0.059552001953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,32,power_law_1.01,0.060159999132156375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,32,power_law_1.2,0.05901439785957337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,32,power_law_1.2,0.0599295973777771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,4,balanced,0.06417066852251689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,4,balanced,0.06597866614659627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,4,power_law_1.01,0.11588480472564697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,4,power_law_1.01,0.12145919799804687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,4,power_law_1.2,0.10544639825820923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,4,power_law_1.2,0.11258879899978638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,64,balanced,0.033200000723203026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,64,balanced,0.03349866718053818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,64,power_law_1.01,0.044844800233840944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,64,power_law_1.01,0.04583680033683777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,64,power_law_1.2,0.04575360119342804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,64,power_law_1.2,0.045817598700523376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,8,balanced,0.04782933493455251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,8,power_law_1.01,0.10406399965286255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,8,power_law_1.01,0.12050559520721435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,8,power_law_1.2,0.09856640100479126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,1,8,power_law_1.2,0.10300159454345703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,16,1,balanced,0.03421866645415624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,16,1,balanced,0.03499733408292135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,16,1,power_law_1.01,0.03570559918880463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,16,1,power_law_1.01,0.03597440123558045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,16,1,power_law_1.2,0.03619840145111084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,16,1,power_law_1.2,0.03649280071258545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,2,1,balanced,0.09366400043169658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,2,1,balanced,0.09514133135477702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,2,1,power_law_1.01,0.09089279770851136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,2,1,power_law_1.01,0.0915391981601715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,2,1,power_law_1.2,0.0908415973186493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,2,1,power_law_1.2,0.09181439876556396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,32,1,balanced,0.03508266558249792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,32,1,balanced,0.0353973334034284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,32,1,power_law_1.01,0.03378559947013855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,32,1,power_law_1.01,0.03421440124511719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,32,1,power_law_1.2,0.034355199337005614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,32,1,power_law_1.2,0.03480960130691528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,4,1,balanced,0.05809600154558817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,4,1,balanced,0.058101331194241844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,4,1,power_law_1.01,0.057120001316070555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,4,1,power_law_1.01,0.05794559717178345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,4,1,power_law_1.2,0.05735679864883423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,4,1,power_law_1.2,0.05751039981842041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,8,1,balanced,0.043882668018341064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,8,1,balanced,0.04452266792456309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,8,1,power_law_1.01,0.04366079866886139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,8,1,power_law_1.01,0.04407680034637451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,8,1,power_law_1.2,0.04364160001277924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,3072,1536,8,256,8,1,power_law_1.2,0.04374400079250336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,1,balanced,0.47467199961344403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,1,balanced,0.4793440103530884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,1,power_law_1.01,0.22935678958892822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,1,power_law_1.01,0.24007039070129393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,1,power_law_1.2,0.25167999267578123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,1,power_law_1.2,0.2962048053741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,2,balanced,0.24489066998163858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,2,balanced,0.2494879961013794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,2,power_law_1.01,0.1703871965408325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,2,power_law_1.01,0.19694080352783203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,2,power_law_1.2,0.19765119552612304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,2,power_law_1.2,0.20235519409179686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,4,balanced,0.17388800779978433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,4,balanced,0.17489065726598105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,4,power_law_1.01,0.1309183955192566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,4,power_law_1.01,0.1409343957901001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,4,power_law_1.2,0.1195520043373108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,4,power_law_1.2,0.1500864028930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,8,balanced,0.11050132910410564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,8,balanced,0.11265066266059875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,8,power_law_1.01,0.10940159559249878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,8,power_law_1.01,0.11030399799346924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,8,power_law_1.2,0.10870399475097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,1,8,power_law_1.2,0.11019519567489625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,16,1,balanced,0.056015998125076294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,16,1,balanced,0.056218668818473816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,16,1,power_law_1.01,0.03782399892807007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,16,1,power_law_1.01,0.03880960047245026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,16,1,power_law_1.2,0.03658879995346069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,16,1,power_law_1.2,0.03850879967212677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,2,1,balanced,0.2506986657778422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,2,1,balanced,0.2553333242734273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,2,1,power_law_1.01,0.14094079732894899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,2,1,power_law_1.01,0.1503167986869812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,2,1,power_law_1.2,0.1372928023338318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,2,1,power_law_1.2,0.17994879484176635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,32,1,balanced,0.03533333291610082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,32,1,balanced,0.039173332353432976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,32,1,power_law_1.01,0.03061760067939758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,32,1,power_law_1.01,0.031142398715019226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,32,1,power_law_1.2,0.031040000915527343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,32,1,power_law_1.2,0.03185279965400696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,4,1,balanced,0.14312533537546793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,4,1,balanced,0.15941333770751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,4,1,power_law_1.01,0.0849727988243103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,4,1,power_law_1.01,0.08724480271339416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,4,1,power_law_1.2,0.08375040292739869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,4,1,power_law_1.2,0.091212797164917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,8,1,balanced,0.09559999903043111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,8,1,balanced,0.097653329372406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,8,1,power_law_1.01,0.05432959794998169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,8,1,power_law_1.01,0.056505602598190305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,8,1,power_law_1.2,0.05431039929389954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,14336,2,8,8,1,power_law_1.2,0.05478399991989136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,1,balanced,0.20995734135309854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,1,balanced,0.21024000644683838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,1,power_law_1.01,0.20515201091766358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,1,power_law_1.01,0.20654079914093018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,1,power_law_1.2,0.20229759216308593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,1,power_law_1.2,0.20431358814239503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,128,balanced,0.03543466577927271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,128,balanced,0.037248000502586365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,128,power_law_1.01,0.03410559892654419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,128,power_law_1.01,0.03430399894714355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,128,power_law_1.2,0.03411200046539307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,128,power_law_1.2,0.03432320058345795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,16,balanced,0.03885333240032196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,16,balanced,0.039359999199708305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,16,power_law_1.01,0.07503359913825988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,16,power_law_1.01,0.07579519748687744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,16,power_law_1.2,0.07184640169143677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,16,power_law_1.2,0.07653759717941284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,2,balanced,0.12636267145474753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,2,balanced,0.12846400340398154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,2,power_law_1.01,0.14728319644927979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,2,power_law_1.01,0.15161600112915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,2,power_law_1.2,0.1285823941230774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,2,power_law_1.2,0.13304320573806763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,32,balanced,0.035504000882307686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,32,balanced,0.0355679988861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,32,power_law_1.01,0.05273600220680237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,32,power_law_1.01,0.05377280116081238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,32,power_law_1.2,0.0494271993637085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,32,power_law_1.2,0.05203199982643127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,4,balanced,0.07778666913509369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,4,balanced,0.08327466746171315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,4,power_law_1.01,0.11119359731674194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,4,power_law_1.01,0.11640959978103638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,4,power_law_1.2,0.10403200387954711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,4,power_law_1.2,0.10743680000305175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,64,balanced,0.03421866645415624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,64,balanced,0.035391998787721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,64,power_law_1.01,0.037190398573875426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,64,power_law_1.01,0.03767040073871612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,64,power_law_1.2,0.0361407995223999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,64,power_law_1.2,0.03661440014839172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,8,balanced,0.05395199855168661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,8,balanced,0.05531733234723409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,8,power_law_1.01,0.09498879909515381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,8,power_law_1.01,0.1090880036354065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,8,power_law_1.2,0.09052159786224365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,1,8,power_law_1.2,0.1064255952835083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,16,1,balanced,0.04160533348719279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,16,1,balanced,0.04301333427429199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,16,1,power_law_1.01,0.042361599206924436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,16,1,power_law_1.01,0.04287360012531281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,16,1,power_law_1.2,0.04268159866333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,16,1,power_law_1.2,0.0433023989200592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,2,1,balanced,0.12601066629091898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,2,1,balanced,0.1274773379166921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,2,1,power_law_1.01,0.11635199785232545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,2,1,power_law_1.01,0.11770880222320557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,2,1,power_law_1.2,0.11185280084609986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,2,1,power_law_1.2,0.11333119869232178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,32,1,balanced,0.039749334255854286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,32,1,balanced,0.03982933362325033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,32,1,power_law_1.01,0.04123519957065582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,32,1,power_law_1.01,0.04139519929885864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,32,1,power_law_1.2,0.041382399201393125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,32,1,power_law_1.2,0.04147840142250061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,4,1,balanced,0.07183466851711273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,4,1,balanced,0.07384000221888225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,4,1,power_law_1.01,0.0707647979259491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,4,1,power_law_1.01,0.07180160284042358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,4,1,power_law_1.2,0.06871039867401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,4,1,power_law_1.2,0.07032960057258605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,8,1,balanced,0.055029332637786865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,8,1,balanced,0.05541866521040598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,8,1,power_law_1.01,0.05381760001182556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,8,1,power_law_1.01,0.05427200198173523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,8,1,power_law_1.2,0.052767997980117796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,1536,8,128,8,1,power_law_1.2,0.05278720259666443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,1,balanced,0.8540693124135336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,1,balanced,0.8558932940165201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,1,power_law_1.01,0.8537343978881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,1,power_law_1.01,0.8555071830749512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,1,power_law_1.2,0.8530048370361328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,1,power_law_1.2,0.8557567596435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,128,balanced,0.03956799954175949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,128,balanced,0.04151466737190882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,128,power_law_1.01,0.07258880138397217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,128,power_law_1.01,0.07386239767074584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,128,power_law_1.2,0.07208960056304932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,128,power_law_1.2,0.07299839854240417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,16,balanced,0.12024533748626709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,16,balanced,0.12133333086967468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,16,power_law_1.01,0.33050239086151123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,16,power_law_1.01,0.33649280071258547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,16,power_law_1.2,0.333516788482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,16,power_law_1.2,0.3409728050231934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,2,balanced,0.4617280165354411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,2,balanced,0.46241601308186847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,2,power_law_1.01,0.5674496173858643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,2,power_law_1.01,0.6180736064910889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,2,power_law_1.2,0.603379201889038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,2,power_law_1.2,0.6278336048126221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,256,balanced,0.03965333352486292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,256,balanced,0.04171200096607208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,256,power_law_1.01,0.05559679865837097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,256,power_law_1.01,0.05576320290565491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,256,power_law_1.2,0.05539199709892273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,256,power_law_1.2,0.055622398853302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,32,balanced,0.08264533181985219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,32,balanced,0.08461866776148479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,32,power_law_1.01,0.1985919952392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,32,power_law_1.01,0.1992576003074646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,32,power_law_1.2,0.19771519899368287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,32,power_law_1.2,0.19893759489059448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,4,balanced,0.26817067464192706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,4,balanced,0.2686079939206441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,4,power_law_1.01,0.4493375778198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,4,power_law_1.01,0.48832001686096194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,4,power_law_1.2,0.43948798179626464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,4,power_law_1.2,0.4512959957122803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,64,balanced,0.0650079995393753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,64,balanced,0.06835199892520905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,64,power_law_1.01,0.12012159824371338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,64,power_law_1.01,0.12014080286026001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,64,power_law_1.2,0.11950080394744873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,64,power_law_1.2,0.12064640522003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,8,balanced,0.16160000363985697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,8,balanced,0.16340266664822897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,8,power_law_1.01,0.38083839416503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,8,power_law_1.01,0.3850048065185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,8,power_law_1.2,0.41621761322021483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,1,8,power_law_1.2,0.4238016128540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,16,1,balanced,0.2381920019785563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,16,1,balanced,0.23947733640670776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,16,1,power_law_1.01,0.23829119205474852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,16,1,power_law_1.01,0.23892478942871093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,16,1,power_law_1.2,0.23812479972839357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,16,1,power_law_1.2,0.23977599143981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,2,1,balanced,0.44926400979359943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,2,1,balanced,0.454309344291687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,2,1,power_law_1.01,0.4495039939880371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,2,1,power_law_1.01,0.4504000186920166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,2,1,power_law_1.2,0.4470655918121338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,2,1,power_law_1.2,0.45029120445251464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,32,1,balanced,0.18249066670735678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,32,1,balanced,0.1848213275273641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,32,1,power_law_1.01,0.1837183952331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,32,1,power_law_1.01,0.18405760526657106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,32,1,power_law_1.2,0.18286720514297486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,32,1,power_law_1.2,0.1835263967514038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,4,1,balanced,0.26418133576711017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,4,1,balanced,0.2667520046234131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,4,1,power_law_1.01,0.26488959789276123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,4,1,power_law_1.01,0.2662911891937256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,4,1,power_law_1.2,0.2640064001083374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,4,1,power_law_1.2,0.26684160232543946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,8,1,balanced,0.16612266500790915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,8,1,balanced,0.1662879983584086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,8,1,power_law_1.01,0.1642367959022522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,8,1,power_law_1.01,0.16484479904174804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,8,1,power_law_1.2,0.16310399770736694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,4096,2688,22,512,8,1,power_law_1.2,0.1644863963127136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,1,balanced,0.7107840379079183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,1,balanced,0.7427946726481119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,1,power_law_1.01,0.49120640754699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,1,power_law_1.01,0.5040575981140136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,1,power_law_1.2,0.45343360900878904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,1,power_law_1.2,0.489350414276123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,2,balanced,0.37587201595306396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,2,balanced,0.40010666847229004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,2,power_law_1.01,0.2689536094665527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,2,power_law_1.01,0.31448960304260254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,2,power_law_1.2,0.23677439689636232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,2,power_law_1.2,0.3054527997970581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,4,balanced,0.22262932856877646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,4,balanced,0.2339466611544291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,4,power_law_1.01,0.1794816017150879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,4,power_law_1.01,0.19322880506515502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,4,power_law_1.2,0.17800960540771485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,4,power_law_1.2,0.18620799779891967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,8,balanced,0.14936533570289612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,8,balanced,0.15255999565124512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,8,power_law_1.01,0.15118080377578735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,8,power_law_1.01,0.15190399885177613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,8,power_law_1.2,0.14985599517822265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,1,8,power_law_1.2,0.15014400482177734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,16,1,balanced,0.07035733262697856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,16,1,balanced,0.07042133311430614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,16,1,power_law_1.01,0.05235840082168579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,16,1,power_law_1.01,0.055615997314453124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,16,1,power_law_1.2,0.05046399831771851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,16,1,power_law_1.2,0.05118079781532288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,2,1,balanced,0.37360533078511554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,2,1,balanced,0.40462934970855713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,2,1,power_law_1.01,0.2268160104751587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,2,1,power_law_1.01,0.25057919025421144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,2,1,power_law_1.2,0.21969919204711913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,2,1,power_law_1.2,0.2825920104980469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,32,1,balanced,0.05172266562779745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,32,1,balanced,0.05186133086681366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,32,1,power_law_1.01,0.04158720076084137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,32,1,power_law_1.01,0.04167680144309997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,32,1,power_law_1.2,0.04260480105876922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,32,1,power_law_1.2,0.04302720129489899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,4,1,balanced,0.21411732832590738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,4,1,balanced,0.22878400484720865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,4,1,power_law_1.01,0.13303680419921876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,4,1,power_law_1.01,0.13959039449691774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,4,1,power_law_1.2,0.14295040369033812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,4,1,power_law_1.2,0.15408639907836913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,8,1,balanced,0.13177067041397095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,8,1,balanced,0.14113600055376688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,8,1,power_law_1.01,0.07402880191802978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,8,1,power_law_1.01,0.08238080143928528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,8,1,power_law_1.2,0.07935360074043274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,16384,2,8,8,1,power_law_1.2,0.08957440257072449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,1,balanced,0.3679200013478597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,1,balanced,0.3817226489384969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,1,power_law_1.01,0.3656575918197632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,1,power_law_1.01,0.36589438915252687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,1,power_law_1.2,0.3657792091369629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,1,power_law_1.2,0.36600959300994873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,128,balanced,0.04306666553020477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,128,balanced,0.04347200194994608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,128,power_law_1.01,0.05801600217819214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,128,power_law_1.01,0.058233600854873654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,128,power_law_1.2,0.05824000239372253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,128,power_law_1.2,0.0587007999420166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,16,balanced,0.06002666552861532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,16,balanced,0.06116800010204315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,16,power_law_1.01,0.2102720022201538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,16,power_law_1.01,0.2159424066543579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,16,power_law_1.2,0.17495039701461793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,16,power_law_1.2,0.19825279712677002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,2,balanced,0.21893332401911417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,2,balanced,0.2193066676457723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,2,power_law_1.01,0.2951872110366821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,2,power_law_1.01,0.32143359184265136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,2,power_law_1.2,0.2844223976135254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,2,power_law_1.2,0.2868160009384155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,256,balanced,0.04381866753101349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,256,balanced,0.04423999786376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,256,power_law_1.01,0.04058879911899567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,256,power_law_1.01,0.041388800740242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,256,power_law_1.2,0.040863999724388124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,256,power_law_1.2,0.04162560105323791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,32,balanced,0.04301866888999939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,32,balanced,0.04381866753101349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,32,power_law_1.01,0.13199360370635987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,32,power_law_1.01,0.1327296018600464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,32,power_law_1.2,0.13419519662857055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,32,power_law_1.2,0.13505280017852783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,4,balanced,0.13570132851600647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,4,balanced,0.1358453333377838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,4,power_law_1.01,0.2582144021987915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,4,power_law_1.01,0.2589375972747803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,4,power_law_1.2,0.2124095916748047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,4,power_law_1.2,0.24972798824310302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,64,balanced,0.04377600053946177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,64,balanced,0.04387199878692627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,64,power_law_1.01,0.0741823971271515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,64,power_law_1.01,0.07560960054397584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,64,power_law_1.2,0.07410560250282287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,64,power_law_1.2,0.07485439777374267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,8,balanced,0.07763200004895528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,8,balanced,0.07812800010045369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,8,power_law_1.01,0.23729279041290283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,8,power_law_1.01,0.2551680088043213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,8,power_law_1.2,0.20375680923461914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,1,8,power_law_1.2,0.21841280460357665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,16,1,balanced,0.058592001597086586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,16,1,balanced,0.05991999804973602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,16,1,power_law_1.01,0.05852159857749939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,16,1,power_law_1.01,0.05858560204505921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,16,1,power_law_1.2,0.058169597387313844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,16,1,power_law_1.2,0.05875840187072754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,2,1,balanced,0.21313067277272543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,2,1,balanced,0.21543467044830322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,2,1,power_law_1.01,0.2138688087463379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,2,1,power_law_1.01,0.2154560089111328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,2,1,power_law_1.2,0.21100161075592042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,2,1,power_law_1.2,0.21278719902038573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,32,1,balanced,0.05407999952634176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,32,1,balanced,0.054154664278030396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,32,1,power_law_1.01,0.05446400046348572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,32,1,power_law_1.01,0.05479679703712463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,32,1,power_law_1.2,0.054585599899291994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,32,1,power_law_1.2,0.05495679974555969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,4,1,balanced,0.13124799728393555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,4,1,balanced,0.13386133313179016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,4,1,power_law_1.01,0.12943999767303466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,4,1,power_law_1.01,0.13102079629898072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,4,1,power_law_1.2,0.13055360317230225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,4,1,power_law_1.2,0.13327360153198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,8,1,balanced,0.07784533500671387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,8,1,balanced,0.07829866806666057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,8,1,power_law_1.01,0.07671679854393006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,8,1,power_law_1.01,0.07777919769287109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,8,1,power_law_1.2,0.07544959783554077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2048,8,256,8,1,power_law_1.2,0.07589120268821717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,1,balanced,0.44830934206644696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,1,balanced,0.45092801253000897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,1,power_law_1.01,0.4482367992401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,1,power_law_1.01,0.44837121963500975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,1,power_law_1.2,0.44871039390563966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,1,power_law_1.2,0.45035519599914553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,16,balanced,0.062421331803003945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,16,balanced,0.06413866579532623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,16,power_law_1.01,0.1622015953063965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,16,power_law_1.01,0.1642367959022522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,16,power_law_1.2,0.17048319578170776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,16,power_law_1.2,0.17125760316848754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,2,balanced,0.24596800406773886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,2,balanced,0.2486720085144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,2,power_law_1.01,0.30064001083374026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,2,power_law_1.01,0.3118783950805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,2,power_law_1.2,0.2780735969543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,2,power_law_1.2,0.29037439823150635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,32,balanced,0.04706133405367533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,32,balanced,0.04959466556708018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,32,power_law_1.01,0.10243200063705445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,32,power_law_1.01,0.10427520275115967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,32,power_law_1.2,0.10348800420761109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,32,power_law_1.2,0.10367360115051269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,4,balanced,0.1458506683508555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,4,balanced,0.14762666821479797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,4,power_law_1.01,0.22364799976348876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,4,power_law_1.01,0.24569599628448485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,4,power_law_1.2,0.2303936004638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,4,power_law_1.2,0.24741759300231933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,8,balanced,0.08470933636029561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,8,balanced,0.08613866567611694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,8,power_law_1.01,0.1831168055534363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,8,power_law_1.01,0.18429440259933472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,8,power_law_1.2,0.1963263988494873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,1,8,power_law_1.2,0.21419520378112794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,16,1,balanced,0.07027199864387512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,16,1,balanced,0.07087466617425282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,16,1,power_law_1.01,0.06838399767875672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,16,1,power_law_1.01,0.06897280216217042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,16,1,power_law_1.2,0.06849920153617858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,16,1,power_law_1.2,0.06911360025405884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,2,1,balanced,0.2410773237546285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,2,1,balanced,0.24200532833735147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,2,1,power_law_1.01,0.2397696018218994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,2,1,power_law_1.01,0.24106240272521973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,2,1,power_law_1.2,0.23971199989318848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,2,1,power_law_1.2,0.2427903890609741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,32,1,balanced,0.05492799977461497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,32,1,balanced,0.0558186670144399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,32,1,power_law_1.01,0.055251199007034305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,32,1,power_law_1.01,0.056032001972198486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,32,1,power_law_1.2,0.05511680245399475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,32,1,power_law_1.2,0.05554559826850891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,4,1,balanced,0.15255999565124512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,4,1,balanced,0.1638879974683126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,4,1,power_law_1.01,0.14314240217208862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,4,1,power_law_1.01,0.14795520305633544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,4,1,power_law_1.2,0.1418239951133728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,4,1,power_law_1.2,0.14362239837646484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,8,1,balanced,0.08947199583053589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,8,1,balanced,0.09101333220799764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,8,1,power_law_1.01,0.0880511999130249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,8,1,power_law_1.01,0.08865919709205627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,8,1,power_law_1.2,0.08805760145187377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,6144,2560,8,160,8,1,power_law_1.2,0.08810880184173583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,1,balanced,0.4252479871114095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,1,balanced,0.42604267597198486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,1,power_law_1.01,0.4222208023071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,1,power_law_1.01,0.4229119777679443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,1,power_law_1.2,0.42177281379699705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,1,power_law_1.2,0.42293758392333985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,128,balanced,0.04770133395989736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,128,balanced,0.049973333875338234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,128,power_law_1.01,0.06217600107192993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,128,power_law_1.01,0.06391680240631104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,128,power_law_1.2,0.06222079992294312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,128,power_law_1.2,0.06280959844589233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,16,balanced,0.06578133503595988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,16,balanced,0.06608533362547557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,16,power_law_1.01,0.24389119148254396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,16,power_law_1.01,0.2471872091293335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,16,power_law_1.2,0.20901761054992676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,16,power_law_1.2,0.2263040065765381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,2,balanced,0.246671994527181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,2,balanced,0.24783466259638467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,2,power_law_1.01,0.3470655918121338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,2,power_law_1.01,0.35129599571228026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,2,power_law_1.2,0.2866111993789673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,2,power_law_1.2,0.3412928104400635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,256,balanced,0.05009600023428599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,256,balanced,0.0513866643110911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,256,power_law_1.01,0.048556798696517946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,256,power_law_1.01,0.0487744003534317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,256,power_law_1.2,0.048403200507164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,256,power_law_1.2,0.05028480291366577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,32,balanced,0.05097066859404246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,32,balanced,0.05207466582457224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,32,power_law_1.01,0.1522752046585083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,32,power_law_1.01,0.15442559719085694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,32,power_law_1.2,0.15314559936523436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,32,power_law_1.2,0.15481599569320678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,4,balanced,0.1548960010210673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,4,balanced,0.15637866655985513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,4,power_law_1.01,0.29907200336456297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,4,power_law_1.01,0.3247744083404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,4,power_law_1.2,0.27194240093231203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,4,power_law_1.2,0.28570239543914794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,64,balanced,0.04967466493447622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,64,balanced,0.04974400003751119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,64,power_law_1.01,0.08771839737892151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,64,power_law_1.01,0.08882560133934021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,64,power_law_1.2,0.08760960102081299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,64,power_law_1.2,0.08800640106201171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,8,balanced,0.08912000060081482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,8,balanced,0.10097600022951762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,8,power_law_1.01,0.2960319995880127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,8,power_law_1.01,0.3172544002532959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,8,power_law_1.2,0.22003839015960694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,1,8,power_law_1.2,0.23816959857940673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,16,1,balanced,0.06806399921576183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,16,1,balanced,0.06874666611353557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,16,1,power_law_1.01,0.06654719710350036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,16,1,power_law_1.01,0.066975998878479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,16,1,power_law_1.2,0.06647040247917176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,16,1,power_law_1.2,0.06673280000686646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,2,1,balanced,0.24365333716074625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,2,1,balanced,0.2595466574033101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,2,1,power_law_1.01,0.2453696012496948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,2,1,power_law_1.01,0.25589759349823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,2,1,power_law_1.2,0.24218881130218506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,2,1,power_law_1.2,0.24375040531158448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,32,1,balanced,0.061978667974472046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,32,1,balanced,0.0629066675901413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,32,1,power_law_1.01,0.0616703987121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,32,1,power_law_1.01,0.06258559823036194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,32,1,power_law_1.2,0.06250879764556885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,32,1,power_law_1.2,0.0625216007232666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,4,1,balanced,0.1527679959932963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,4,1,balanced,0.17307200034459433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,4,1,power_law_1.01,0.15163520574569703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,4,1,power_law_1.01,0.1530176043510437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,4,1,power_law_1.2,0.15149439573287965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,4,1,power_law_1.2,0.15253759622573854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,8,1,balanced,0.08846400181452434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,8,1,balanced,0.08877866466840108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,8,1,power_law_1.01,0.08798720240592957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,8,1,power_law_1.01,0.08854399919509888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,8,1,power_law_1.2,0.08608639836311341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,256,8,1,power_law_1.2,0.08652799725532531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,1,balanced,0.4256960153579712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,1,balanced,0.42601601282755536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,1,power_law_1.01,0.4225152015686035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,1,power_law_1.01,0.4226687908172607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,1,power_law_1.2,0.42179198265075685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,1,power_law_1.2,0.4248640060424805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,128,balanced,0.0498986691236496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,128,balanced,0.05125333368778229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,128,power_law_1.01,0.06940799951553345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,128,power_law_1.01,0.06970880031585694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,128,power_law_1.2,0.06895999908447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,128,power_law_1.2,0.06983680129051209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,16,balanced,0.06422933439413707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,16,balanced,0.06434666613737743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,16,power_law_1.01,0.3361855983734131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,16,power_law_1.01,0.3382591962814331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,16,power_law_1.2,0.2865151882171631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,16,power_law_1.2,0.2956543922424316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,2,balanced,0.24966933329900107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,2,balanced,0.2752853234608968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,2,power_law_1.01,0.42868480682373045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,2,power_law_1.01,0.4298880100250244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,2,power_law_1.2,0.35789439678192136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,2,power_law_1.2,0.37303040027618406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,32,balanced,0.05008000135421753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,32,balanced,0.051370665431022644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,32,power_law_1.01,0.1826688051223755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,32,power_law_1.01,0.1847808003425598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,32,power_law_1.2,0.18504960536956788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,32,power_law_1.2,0.1850559949874878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,4,balanced,0.1537493367989858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,4,balanced,0.15450132886568704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,4,power_law_1.01,0.4303743839263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,4,power_law_1.01,0.4310719966888428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,4,power_law_1.2,0.3273024082183838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,4,power_law_1.2,0.3378623962402344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,64,balanced,0.04987733562787374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,64,balanced,0.052298665046691895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,64,power_law_1.01,0.10739840269088745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,64,power_law_1.01,0.107750403881073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,64,power_law_1.2,0.10767359733581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,64,power_law_1.2,0.10776319503784179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,8,balanced,0.08892800410588582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,8,balanced,0.09411199887593587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,8,power_law_1.01,0.4280831813812256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,8,power_law_1.01,0.4314176082611084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,8,power_law_1.2,0.3173952102661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,1,8,power_law_1.2,0.3205312013626099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,16,1,balanced,0.06791999936103821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,16,1,balanced,0.0680159976085027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,16,1,power_law_1.01,0.06662399768829345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,16,1,power_law_1.01,0.06668800115585327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,16,1,power_law_1.2,0.06567680239677429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,16,1,power_law_1.2,0.06704639792442321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,2,1,balanced,0.24396266539891562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,2,1,balanced,0.24416534105936685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,2,1,power_law_1.01,0.24145920276641847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,2,1,power_law_1.01,0.2427135944366455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,2,1,power_law_1.2,0.24077439308166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,2,1,power_law_1.2,0.24289920330047607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,32,1,balanced,0.062319998939832054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,32,1,balanced,0.0642986645301183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,32,1,power_law_1.01,0.06028159856796265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,32,1,power_law_1.01,0.060627198219299315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,32,1,power_law_1.2,0.06218879818916321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,32,1,power_law_1.2,0.06235520243644714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,4,1,balanced,0.1569493313630422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,4,1,balanced,0.1670666734377543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,4,1,power_law_1.01,0.1544319987297058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,4,1,power_law_1.01,0.15495680570602416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,4,1,power_law_1.2,0.15312000513076782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,4,1,power_law_1.2,0.15457279682159425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,8,1,balanced,0.0881119966506958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,8,1,balanced,0.08875200152397156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,8,1,power_law_1.01,0.08602880239486695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,8,1,power_law_1.01,0.0862335979938507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,8,1,power_law_1.2,0.08624640107154846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4,7168,2048,8,384,8,1,power_law_1.2,0.08669440150260925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,1,balanced,0.49984534581502277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,1,balanced,0.5000160137812296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,1,power_law_1.01,0.6342336177825928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,1,power_law_1.01,0.6440320014953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,1,power_law_1.2,0.6683712005615234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,1,power_law_1.2,0.6690815925598145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,128,balanced,0.22578666607538858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,128,balanced,0.22764267524083456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,128,power_law_1.01,0.24341120719909667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,128,power_law_1.01,0.24455680847167968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,128,power_law_1.2,0.25791358947753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,128,power_law_1.2,0.26005120277404786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,16,balanced,0.24614399671554565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,16,balanced,0.24628265698750815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,16,power_law_1.01,0.275980806350708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,16,power_law_1.01,0.28126718997955324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,16,power_law_1.2,0.2820800065994263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,16,power_law_1.2,0.29447040557861326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,2,balanced,0.4211039940516154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,2,balanced,0.4216426610946655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,2,power_law_1.01,0.48673281669616697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,2,power_law_1.01,0.4878528118133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,2,power_law_1.2,0.4881599903106689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,2,power_law_1.2,0.5086656093597413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,32,balanced,0.2339893380800883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,32,balanced,0.2351413369178772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,32,power_law_1.01,0.2614847898483276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,32,power_law_1.01,0.2618112087249756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,32,power_law_1.2,0.27467520236968995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,32,power_law_1.2,0.2755136013031006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,4,balanced,0.32210665941238403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,4,balanced,0.3238079945246379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,4,power_law_1.01,0.366156792640686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,4,power_law_1.01,0.373523211479187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,4,power_law_1.2,0.3817023992538452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,4,power_law_1.2,0.3874880075454712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,64,balanced,0.22852800289789835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,64,balanced,0.2298133373260498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,64,power_law_1.01,0.2489408016204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,64,power_law_1.01,0.2498944044113159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,64,power_law_1.2,0.26211841106414796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,64,power_law_1.2,0.2657599925994873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,8,balanced,0.2728266716003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,8,balanced,0.27323732773462933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,8,power_law_1.01,0.30475521087646484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,8,power_law_1.01,0.32325119972229005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,8,power_law_1.2,0.317139196395874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,1,8,power_law_1.2,0.32108800411224364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,2,1,balanced,0.3718453248341878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,2,1,balanced,0.37194132804870605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,2,1,power_law_1.01,0.41568641662597655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,2,1,power_law_1.01,0.42162561416625977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,2,1,power_law_1.2,0.42785282135009767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,2,1,power_law_1.2,0.428710412979126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,4,1,balanced,0.2715946634610494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,4,1,balanced,0.2722986737887065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,4,1,power_law_1.01,0.30811519622802735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,4,1,power_law_1.01,0.30906879901885986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,4,1,power_law_1.2,0.3090111970901489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2048,768,8,128,4,1,power_law_1.2,0.31128320693969724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,1,balanced,1.2470719814300537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,1,balanced,1.2647733688354492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,1,power_law_1.01,1.3383872032165527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,1,power_law_1.01,1.3628031730651855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,1,power_law_1.2,1.3820159912109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,1,power_law_1.2,1.4014464378356934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,128,balanced,0.29915199677149457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,128,balanced,0.2997066577275594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,128,power_law_1.01,0.33512320518493655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,128,power_law_1.01,0.3445568084716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,128,power_law_1.2,0.3698944091796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,128,power_law_1.2,0.3736191987991333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,16,balanced,0.36085331439971924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,16,balanced,0.3615573247273763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,16,power_law_1.01,0.41254401206970215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,16,power_law_1.01,0.4210239887237549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,16,power_law_1.2,0.4168191909790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,16,power_law_1.2,0.45070719718933105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,2,balanced,0.8460853099822998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,2,balanced,0.8501813411712646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,2,power_law_1.01,0.9149184226989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,2,power_law_1.01,0.9511360168457031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,2,power_law_1.2,0.9456959724426269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,2,power_law_1.2,0.9469440460205079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,32,balanced,0.3216639955838521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,32,balanced,0.322437326113383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,32,power_law_1.01,0.3678272008895874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,32,power_law_1.01,0.3736576080322266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,32,power_law_1.2,0.39276158809661865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,32,power_law_1.2,0.4074431896209717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,4,balanced,0.5732906659444174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,4,balanced,0.5735573371251425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,4,power_law_1.01,0.6311423778533936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,4,power_law_1.01,0.6400256156921387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,4,power_law_1.2,0.6435455799102783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,4,power_law_1.2,0.6791296005249023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,64,balanced,0.30509867270787555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,64,balanced,0.3051786621411641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,64,power_law_1.01,0.34340479373931887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,64,power_law_1.01,0.3483839988708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,64,power_law_1.2,0.371942400932312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,64,power_law_1.2,0.3786303997039795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,8,balanced,0.4351840019226074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,8,balanced,0.4355893135070801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,8,power_law_1.01,0.48769278526306153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,8,power_law_1.01,0.49470081329345705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,8,power_law_1.2,0.5196288108825684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,1,8,power_law_1.2,0.5330175876617431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,16,1,balanced,0.5744693279266357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,16,1,balanced,0.5751253366470337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,16,1,power_law_1.01,0.60730881690979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,16,1,power_law_1.01,0.6118527889251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,16,1,power_law_1.2,0.6166783809661865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,16,1,power_law_1.2,0.6193535804748536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,2,1,balanced,0.7939519882202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,2,1,balanced,0.7955093383789062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,2,1,power_law_1.01,0.8334591865539551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,2,1,power_law_1.01,0.8394240379333496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,2,1,power_law_1.2,0.8520768165588379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,2,1,power_law_1.2,0.858739185333252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,32,1,balanced,0.46888534228007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,32,1,balanced,0.4691840012868245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,32,1,power_law_1.01,0.4962048053741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,32,1,power_law_1.01,0.49836158752441406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,32,1,power_law_1.2,0.5048384189605712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,32,1,power_law_1.2,0.5111040115356446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,4,1,balanced,0.5033386548360189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,4,1,balanced,0.504858652750651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,4,1,power_law_1.01,0.5331520080566406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,4,1,power_law_1.01,0.5370944023132325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,4,1,power_law_1.2,0.5450496196746826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,4,1,power_law_1.2,0.5466432094573974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,8,1,balanced,0.7272000312805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,8,1,balanced,0.7281333605448405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,8,1,power_law_1.01,0.7720448017120362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,8,1,power_law_1.01,0.7786176204681396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,8,1,power_law_1.2,0.7877439975738525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,2688,1856,6,128,8,1,power_law_1.2,0.7980095863342285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,1,balanced,1.7330773671468098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,1,balanced,1.8105866114298503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,1,power_law_1.01,2.1316864013671877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,1,power_law_1.01,2.226982307434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,1,power_law_1.2,2.2037631988525392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,1,power_law_1.2,2.3808767318725588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,128,balanced,0.3654613494873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,128,balanced,0.36698134740193683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,128,power_law_1.01,0.39898879528045655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,128,power_law_1.01,0.4029888153076172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,128,power_law_1.2,0.42531838417053225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,128,power_law_1.2,0.42755842208862305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,16,balanced,0.44037866592407227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,16,balanced,0.44096533457438153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,16,power_law_1.01,0.5298240184783936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,16,power_law_1.01,0.5310207843780518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,16,power_law_1.2,0.5454463958740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,16,power_law_1.2,0.5563519954681396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,2,balanced,1.0416053136189778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,2,balanced,1.0481759707132976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,2,power_law_1.01,1.3028544425964355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,2,power_law_1.01,1.3035584449768067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,2,power_law_1.2,1.3439807891845703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,2,power_law_1.2,1.358233642578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,256,balanced,0.3614773352940877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,256,balanced,0.3617813189824422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,256,power_law_1.01,0.3878976106643677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,256,power_law_1.01,0.3886080026626587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,256,power_law_1.2,0.41208319664001464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,256,power_law_1.2,0.41861758232116697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,32,balanced,0.3925600051879883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,32,balanced,0.39449600378672284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,32,power_law_1.01,0.4511807918548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,32,power_law_1.01,0.4598720073699951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,32,power_law_1.2,0.47583999633789065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,32,power_law_1.2,0.47774720191955566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,4,balanced,0.7028906345367432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,4,balanced,0.7050399780273438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,4,power_law_1.01,0.8529279708862305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,4,power_law_1.01,0.8606399536132813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,4,power_law_1.2,0.9003199577331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,4,power_law_1.2,0.9300224304199218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,64,balanced,0.37195734182993573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,64,balanced,0.37276800473531085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,64,power_law_1.01,0.4136064052581787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,64,power_law_1.01,0.42177281379699705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,64,power_law_1.2,0.433241605758667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,64,power_law_1.2,0.44315519332885744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,8,balanced,0.5248746474583944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,8,balanced,0.5270453294118246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,8,power_law_1.01,0.6391488075256347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,8,power_law_1.01,0.6512959957122803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,8,power_law_1.2,0.6631040096282959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,1,8,power_law_1.2,0.6652416229248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,16,1,balanced,0.3519359827041626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,16,1,balanced,0.3521920045216878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,16,1,power_law_1.01,0.42220158576965333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,16,1,power_law_1.01,0.4235968112945557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,16,1,power_law_1.2,0.4462463855743408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,16,1,power_law_1.2,0.44971518516540526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,2,1,balanced,0.9637066523234049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,2,1,balanced,0.9640693664550781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,2,1,power_law_1.01,1.1965184211730957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,2,1,power_law_1.01,1.2163264274597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,2,1,power_law_1.2,1.2500479698181153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,2,1,power_law_1.2,1.255014419555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,32,1,balanced,0.29789867003758747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,32,1,balanced,0.29919999837875366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,32,1,power_law_1.01,0.361625599861145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,32,1,power_law_1.01,0.3620287895202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,32,1,power_law_1.2,0.3669823884963989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,32,1,power_law_1.2,0.3676352024078369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,4,1,balanced,0.6004480123519897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,4,1,balanced,0.6021440029144287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,4,1,power_law_1.01,0.7327744007110596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,4,1,power_law_1.01,0.7363647937774658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,4,1,power_law_1.2,0.7567103862762451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,4,1,power_law_1.2,0.7616511821746826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,8,1,balanced,0.4229866663614909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,8,1,balanced,0.42473065853118896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,8,1,power_law_1.01,0.5185728073120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,8,1,power_law_1.01,0.5199103832244873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,8,1,power_law_1.2,0.5258368015289306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,3072,1536,8,256,8,1,power_law_1.2,0.5259456157684326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,1,balanced,3.338165283203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,1,balanced,3.4294506708780923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,1,power_law_1.01,3.4284736633300783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,1,power_law_1.01,3.443782424926758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,1,power_law_1.2,3.486713409423828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,1,power_law_1.2,3.5098880767822265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,2,balanced,1.8542985916137695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,2,balanced,1.8965013821919758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,2,power_law_1.01,2.5655744552612303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,2,power_law_1.01,2.687513542175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,2,power_law_1.2,2.279852867126465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,2,power_law_1.2,2.2849920272827147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,4,balanced,1.1284853617350261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,4,balanced,1.1297600269317627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,4,power_law_1.01,1.86810245513916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,4,power_law_1.01,1.9874624252319335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,4,power_law_1.2,1.9043008804321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,4,power_law_1.2,1.9432191848754883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,8,balanced,0.779807964960734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,8,balanced,0.7802293300628662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,8,power_law_1.01,1.5793727874755858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,8,power_law_1.01,1.727743911743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,8,power_law_1.2,1.6281984329223633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,1,8,power_law_1.2,1.7646591186523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,16,1,balanced,0.3006986578305562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,16,1,balanced,0.30212799708048504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,16,1,power_law_1.01,0.3056256055831909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,16,1,power_law_1.01,0.30813438892364503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,16,1,power_law_1.2,0.30426878929138185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,16,1,power_law_1.2,0.30714879035949705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,2,1,balanced,1.5985760688781738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,2,1,balanced,1.6215626398722331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,2,1,power_law_1.01,1.717862319946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,2,1,power_law_1.01,1.727724838256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,2,1,power_law_1.2,1.7006719589233399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,2,1,power_law_1.2,1.7277311325073241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,32,1,balanced,0.19992534319559732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,32,1,balanced,0.2000746726989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,32,1,power_law_1.01,0.20638720989227294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,32,1,power_law_1.01,0.20770559310913086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,32,1,power_law_1.2,0.20560638904571532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,32,1,power_law_1.2,0.20655999183654786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,4,1,balanced,0.8336319923400879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,4,1,balanced,0.8398293654123942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,4,1,power_law_1.01,0.9060864448547363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,4,1,power_law_1.01,0.9133312225341796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,4,1,power_law_1.2,0.9072896003723144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,4,1,power_law_1.2,0.9092864036560059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,8,1,balanced,0.4759039878845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,8,1,balanced,0.47599466641743976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,8,1,power_law_1.01,0.4957759857177734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,8,1,power_law_1.01,0.5012095928192138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,8,1,power_law_1.2,0.4969344139099121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,14336,2,8,8,1,power_law_1.2,0.5002943992614746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,1,balanced,1.8042933146158855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,1,balanced,1.821349302927653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,1,power_law_1.01,2.122764778137207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,1,power_law_1.01,2.149849510192871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,1,power_law_1.2,2.136396789550781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,1,power_law_1.2,2.16497917175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,128,balanced,0.3859306573867798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,128,balanced,0.3867786725362142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,128,power_law_1.01,0.45606398582458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,128,power_law_1.01,0.4606912136077881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,128,power_law_1.2,0.49502081871032716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,128,power_law_1.2,0.5111551761627198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,16,balanced,0.46401600042978924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,16,balanced,0.46556798617045086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,16,power_law_1.01,0.5447743892669678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,16,power_law_1.01,0.5893439769744873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,16,power_law_1.2,0.5888192176818847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,16,power_law_1.2,0.6389503955841065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,2,balanced,1.1017706394195557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,2,balanced,1.1204319794972737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,2,power_law_1.01,1.302995204925537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,2,power_law_1.01,1.3292351722717286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,2,power_law_1.2,1.3642815589904784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,2,power_law_1.2,1.3967743873596192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,32,balanced,0.4188479979832967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,32,balanced,0.4203626712163289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,32,power_law_1.01,0.5196928024291992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,32,power_law_1.01,0.5220223903656006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,32,power_law_1.2,0.5556223869323731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,32,power_law_1.2,0.5638912200927735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,4,balanced,0.7378079891204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,4,balanced,0.7386933167775472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,4,power_law_1.01,0.8958463668823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,4,power_law_1.01,0.8978560447692872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,4,power_law_1.2,0.9325119972229003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,4,power_law_1.2,0.9921024322509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,64,balanced,0.3962506850560506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,64,balanced,0.3988373279571533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,64,power_law_1.01,0.4598656177520752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,64,power_law_1.01,0.47559680938720705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,64,power_law_1.2,0.5245952129364013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,64,power_law_1.2,0.5336128234863281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,8,balanced,0.555621345837911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,8,balanced,0.5565439860026041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,8,power_law_1.01,0.6800191879272461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,8,power_law_1.01,0.7117440223693847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,8,power_law_1.2,0.7258175849914551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,1,8,power_law_1.2,0.7365632057189941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,16,1,balanced,0.4040213425954183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,16,1,balanced,0.40587735176086426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,16,1,power_law_1.01,0.4709951877593994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,16,1,power_law_1.01,0.4716671943664551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,16,1,power_law_1.2,0.4743680000305176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,16,1,power_law_1.2,0.4744448184967041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,2,1,balanced,0.88372270266215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,2,1,balanced,0.8900480270385742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,2,1,power_law_1.01,1.1447423934936523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,2,1,power_law_1.01,1.1712575912475587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,2,1,power_law_1.2,1.185747241973877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,2,1,power_law_1.2,1.1858816146850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,32,1,balanced,0.3454986810684204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,32,1,balanced,0.3455466826756795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,32,1,power_law_1.01,0.40349440574645995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,32,1,power_law_1.01,0.4037759780883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,32,1,power_law_1.2,0.40645761489868165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,32,1,power_law_1.2,0.40750718116760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,4,1,balanced,0.6588693459828695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,4,1,balanced,0.6611733436584473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,4,1,power_law_1.01,0.7544000148773193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,4,1,power_law_1.01,0.7641215801239014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,4,1,power_law_1.2,0.7763391971588135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,4,1,power_law_1.2,0.778982400894165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,8,1,balanced,0.47626666227976483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,8,1,balanced,0.47755201657613117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,8,1,power_law_1.01,0.5441792011260986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,8,1,power_law_1.01,0.5480000019073487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,8,1,power_law_1.2,0.549894380569458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,1536,8,128,8,1,power_law_1.2,0.5524608135223389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,1,balanced,12.55298105875651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,1,balanced,12.923322041829428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,1,power_law_1.01,12.772006225585937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,1,power_law_1.01,12.810092163085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,1,power_law_1.2,13.002847290039062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,1,power_law_1.2,13.186802673339844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,128,balanced,1.4111839930216472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,128,balanced,1.4123466809590657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,128,power_law_1.01,1.5308095932006835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,128,power_law_1.01,1.5577280044555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,128,power_law_1.2,1.629420852661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,128,power_law_1.2,1.649888038635254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,16,balanced,1.947264035542806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,16,balanced,1.951375961303711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,16,power_law_1.01,2.122329521179199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,16,power_law_1.01,2.1490816116333007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,16,power_law_1.2,2.1753536224365235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,16,power_law_1.2,2.2312959671020507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,2,balanced,6.618810653686523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,2,balanced,6.625781377156575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,2,power_law_1.01,6.93031005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,2,power_law_1.01,6.930764770507812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,2,power_law_1.2,7.167462158203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,2,power_law_1.2,7.56592025756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,256,balanced,1.3670399983723958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,256,balanced,1.3703840573628743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,256,power_law_1.01,1.4707200050354003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,256,power_law_1.01,1.4851455688476562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,256,power_law_1.2,1.5531968116760253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,256,power_law_1.2,1.5546303749084474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,32,balanced,1.6373333930969238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,32,balanced,1.6375734011332195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,32,power_law_1.01,1.8184640884399415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,32,power_law_1.01,1.849171257019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,32,power_law_1.2,1.9123519897460937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,32,power_law_1.2,1.9202495574951173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,4,balanced,3.828458786010742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,4,balanced,3.918272018432617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,4,power_law_1.01,4.063283157348633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,4,power_law_1.01,4.10761604309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,4,power_law_1.2,4.310886383056641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,4,power_law_1.2,4.336691284179688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,64,balanced,1.4867146809895833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,64,balanced,1.4875413576761882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,64,power_law_1.01,1.6274303436279296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,64,power_law_1.01,1.6453119277954102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,64,power_law_1.2,1.7429376602172852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,64,power_law_1.2,1.7711423873901366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,8,balanced,2.573040008544922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,8,balanced,2.5751466751098633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,8,power_law_1.01,2.83570556640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,8,power_law_1.01,2.8570560455322265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,8,power_law_1.2,2.920390319824219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,1,8,power_law_1.2,3.0350080490112306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,16,1,balanced,3.3945439656575522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,16,1,balanced,3.395375887552897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,16,1,power_law_1.01,3.4960193634033203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,16,1,power_law_1.01,3.4965438842773438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,16,1,power_law_1.2,3.578540802001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,16,1,power_law_1.2,3.592825698852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,2,1,balanced,5.554831822713216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,2,1,balanced,5.844858805338542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,2,1,power_law_1.01,5.71383056640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,2,1,power_law_1.01,5.860019302368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,2,1,power_law_1.2,5.777638244628906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,2,1,power_law_1.2,6.0504192352294925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,32,1,balanced,2.9605334599812827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,32,1,balanced,2.9618825912475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,32,1,power_law_1.01,3.0539520263671873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,32,1,power_law_1.01,3.072422409057617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,32,1,power_law_1.2,3.123481559753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,32,1,power_law_1.2,3.124799919128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,4,1,balanced,8.509637196858725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,4,1,balanced,8.5851198832194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,4,1,power_law_1.01,8.91391372680664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,4,1,power_law_1.01,8.983980560302735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,4,1,power_law_1.2,8.721631622314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,4,1,power_law_1.2,9.087686157226562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,8,1,balanced,2.2380587259928384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,8,1,balanced,2.2496800422668457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,8,1,power_law_1.01,2.244927978515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,8,1,power_law_1.01,2.251481628417969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,8,1,power_law_1.2,2.3016895294189452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,4096,2688,22,512,8,1,power_law_1.2,2.3349632263183593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,1,balanced,5.520762761433919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,1,balanced,5.8908265431722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,1,power_law_1.01,5.7491905212402346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,1,power_law_1.01,6.117657470703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,1,power_law_1.2,5.997491073608399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,1,power_law_1.2,6.05720329284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,2,balanced,3.0503946940104165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,2,balanced,3.08026123046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,2,power_law_1.01,3.815526580810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,2,power_law_1.01,4.681184005737305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,2,power_law_1.2,4.254233551025391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,2,power_law_1.2,4.752115249633789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,4,balanced,1.6810132662455242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,4,balanced,1.7026185989379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,4,power_law_1.01,2.853388786315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,4,power_law_1.01,3.2130817413330077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,4,power_law_1.2,2.9903680801391603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,4,power_law_1.2,2.993465614318848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,8,balanced,1.1320160230000813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,8,balanced,1.1321067015329997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,8,power_law_1.01,2.706547164916992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,8,power_law_1.01,2.809676742553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,8,power_law_1.2,2.7665727615356444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,1,8,power_law_1.2,2.787295913696289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,16,1,balanced,0.44412267208099365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,16,1,balanced,0.4447733163833618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,16,1,power_law_1.01,0.46219520568847655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,16,1,power_law_1.01,0.46302080154418945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,16,1,power_law_1.2,0.4571072101593018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,16,1,power_law_1.2,0.46073598861694337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,2,1,balanced,2.78817081451416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,2,1,balanced,2.958149274190267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,2,1,power_law_1.01,2.84335994720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,2,1,power_law_1.01,2.843449592590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,2,1,power_law_1.2,2.813164710998535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,2,1,power_law_1.2,2.8429376602172853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,32,1,balanced,0.2901279926300049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,32,1,balanced,0.2911840081214905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,32,1,power_law_1.01,0.29605119228363036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,32,1,power_law_1.01,0.3035520076751709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,32,1,power_law_1.2,0.2967616081237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,32,1,power_law_1.2,0.3005631923675537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,4,1,balanced,1.3901599248250325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,4,1,balanced,1.416437307993571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,4,1,power_law_1.01,1.4558143615722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,4,1,power_law_1.01,1.4589632034301758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,4,1,power_law_1.2,1.4690943717956544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,4,1,power_law_1.2,1.4727744102478026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,8,1,balanced,0.7319253285725912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,8,1,balanced,0.7401546637217203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,8,1,power_law_1.01,0.7942207813262939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,8,1,power_law_1.01,0.7950528144836426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,8,1,power_law_1.2,0.7965248107910157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,16384,2,8,8,1,power_law_1.2,0.800921630859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,1,balanced,4.2698774337768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,1,balanced,4.478069305419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,1,power_law_1.01,5.717119979858398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,1,power_law_1.01,5.8063617706298825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,1,power_law_1.2,5.726265716552734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,1,power_law_1.2,6.150905609130859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,128,balanced,0.590768019358317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,128,balanced,0.5931733449300131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,128,power_law_1.01,0.6760191917419434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,128,power_law_1.01,0.6855743885040283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,128,power_law_1.2,0.7208511829376221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,128,power_law_1.2,0.7306047916412354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,16,balanced,0.7852319876352946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,16,balanced,0.7878506978352865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,16,power_law_1.01,0.9721535682678223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,16,power_law_1.01,0.9740287780761718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,16,power_law_1.2,1.0261055946350097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,16,power_law_1.2,1.0631679534912108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,2,balanced,2.4044052759806314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,2,balanced,2.63594659169515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,2,power_law_1.01,3.209638214111328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,2,power_law_1.01,3.233651351928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,2,power_law_1.2,3.204256057739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,2,power_law_1.2,3.2260799407958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,256,balanced,0.5839466651280721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,256,balanced,0.5858240127563477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,256,power_law_1.01,0.6445631980895996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,256,power_law_1.01,0.6531904220581055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,256,power_law_1.2,0.701798391342163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,256,power_law_1.2,0.724076795578003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,32,balanced,0.673583984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,32,balanced,0.6745440165201823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,32,power_law_1.01,0.8273856163024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,32,power_law_1.01,0.8674240112304688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,32,power_law_1.2,0.8581760406494141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,32,power_law_1.2,0.8659903526306152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,4,balanced,1.4575519561767578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,4,balanced,1.4737866719563801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,4,power_law_1.01,1.850752067565918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,4,power_law_1.01,1.8861503601074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,4,power_law_1.2,1.9643072128295898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,4,power_law_1.2,2.0059072494506838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,64,balanced,0.6129493316014608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,64,balanced,0.6154346863428751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,64,power_law_1.01,0.7259647846221924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,64,power_law_1.01,0.747372817993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,64,power_law_1.2,0.7978943824768067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,64,power_law_1.2,0.8070015907287598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,8,balanced,1.0064533551534016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,8,balanced,1.007040023803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,8,power_law_1.01,1.2475775718688964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,8,power_law_1.01,1.319699192047119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,8,power_law_1.2,1.3604351997375488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,1,8,power_law_1.2,1.3698495864868163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,16,1,balanced,0.6530186732610067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,16,1,balanced,0.6549973487854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,16,1,power_law_1.01,0.7884543895721435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,16,1,power_law_1.01,0.7941952228546143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,16,1,power_law_1.2,0.8323967933654786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,16,1,power_law_1.2,0.8350208282470704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,2,1,balanced,2.2383947372436523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,2,1,balanced,2.23854398727417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,2,1,power_law_1.01,2.9180736541748047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,2,1,power_law_1.01,3.0044992446899412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,2,1,power_law_1.2,3.0308351516723633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,2,1,power_law_1.2,3.0980224609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,32,1,balanced,0.5438880125681559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,32,1,balanced,0.5447146495183309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,32,1,power_law_1.01,0.6629759788513183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,32,1,power_law_1.01,0.6652991771697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,32,1,power_law_1.2,0.6726655960083008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,32,1,power_law_1.2,0.6755648136138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,4,1,balanced,1.3103360335032146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,4,1,balanced,1.3156639734903972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,4,1,power_law_1.01,1.6607488632202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,4,1,power_law_1.01,1.6622911453247071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,4,1,power_law_1.2,1.7114431381225585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,4,1,power_law_1.2,1.7281856536865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,8,1,balanced,0.8749866485595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,8,1,balanced,0.875104029973348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,8,1,power_law_1.01,1.08024320602417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,8,1,power_law_1.01,1.0828031539916991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,8,1,power_law_1.2,1.1253952026367187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2048,8,256,8,1,power_law_1.2,1.1256511688232422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,1,balanced,5.3330027262369795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,1,balanced,5.412570953369141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,1,power_law_1.01,6.033337783813477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,1,power_law_1.01,6.070329666137695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,1,power_law_1.2,5.854995346069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,1,power_law_1.2,5.982675170898437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,16,balanced,0.8418880303700765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,16,balanced,0.8446933428446451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,16,power_law_1.01,1.0360832214355469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,16,power_law_1.01,1.0614848136901855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,16,power_law_1.2,1.1084608078002929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,16,power_law_1.2,1.1601920127868652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,2,balanced,2.9069334665934243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,2,balanced,2.963184038798014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,2,power_law_1.01,3.2878528594970704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,2,power_law_1.01,3.3367935180664063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,2,power_law_1.2,3.379199981689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,2,power_law_1.2,3.481305694580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,32,balanced,0.7066400051116943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,32,balanced,0.7076799869537354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,32,power_law_1.01,0.8373311996459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,32,power_law_1.01,0.9089152336120605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,32,power_law_1.2,1.0100288391113281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,32,power_law_1.2,1.0214271545410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,4,balanced,1.6856266657511394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,4,balanced,1.693610668182373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,4,power_law_1.01,1.9992319107055665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,4,power_law_1.01,2.0214975357055662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,4,power_law_1.2,2.1229503631591795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,4,power_law_1.2,2.1475456237792967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,8,balanced,1.1142559846242268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,8,balanced,1.1150133609771729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,8,power_law_1.01,1.350425624847412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,8,power_law_1.01,1.382585620880127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,8,power_law_1.2,1.4352255821228028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,1,8,power_law_1.2,1.5088512420654296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,16,1,balanced,0.7581546306610107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,16,1,balanced,0.7592746416727701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,16,1,power_law_1.01,0.7992767810821533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,16,1,power_law_1.01,0.8031423568725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,16,1,power_law_1.2,0.8061247825622558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,16,1,power_law_1.2,0.8074239730834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,2,1,balanced,2.6768531799316406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,2,1,balanced,2.8551413218180337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,2,1,power_law_1.01,2.9929344177246096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,2,1,power_law_1.01,3.0077056884765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,2,1,power_law_1.2,2.895257568359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,2,1,power_law_1.2,3.0628543853759767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,32,1,balanced,0.6553013324737549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,32,1,balanced,0.6553333202997843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,32,1,power_law_1.01,0.6882559776306152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,32,1,power_law_1.01,0.6895872116088867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,32,1,power_law_1.2,0.695084810256958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,32,1,power_law_1.2,0.6965439796447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,4,1,balanced,1.5253973007202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,4,1,balanced,1.5787413914998372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,4,1,power_law_1.01,1.6493440628051759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,4,1,power_law_1.01,1.6734336853027343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,4,1,power_law_1.2,1.6878976821899414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,4,1,power_law_1.2,1.7276416778564454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,8,1,balanced,0.9791573683420817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,8,1,balanced,0.9805440107981364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,8,1,power_law_1.01,1.0607616424560546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,8,1,power_law_1.01,1.066534423828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,8,1,power_law_1.2,1.0682496070861816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,6144,2560,8,160,8,1,power_law_1.2,1.0772095680236817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,1,balanced,5.007520039876302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,1,balanced,5.07695992787679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,1,power_law_1.01,6.955763244628907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,1,power_law_1.01,6.995737457275391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,1,power_law_1.2,7.038137817382813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,1,power_law_1.2,7.048563385009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,128,balanced,0.6508586804072062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,128,balanced,0.6519146760304769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,128,power_law_1.01,0.7570816040039062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,128,power_law_1.01,0.7632959842681885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,128,power_law_1.2,0.8048768043518066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,128,power_law_1.2,0.8236607551574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,16,balanced,0.8822133541107178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,16,balanced,0.8827253182729086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,16,power_law_1.01,1.0896448135375976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,16,power_law_1.01,1.0943615913391114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,16,power_law_1.2,1.1809727668762207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,16,power_law_1.2,1.2017919540405273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,2,balanced,2.9151414235432944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,2,balanced,2.920570691426595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,2,power_law_1.01,3.558720016479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,2,power_law_1.01,3.8495296478271483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,2,power_law_1.2,3.85351676940918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,2,power_law_1.2,4.102438354492188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,256,balanced,0.6408426761627197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,256,balanced,0.6455519994099935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,256,power_law_1.01,0.7183487892150879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,256,power_law_1.01,0.722540807723999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,256,power_law_1.2,0.7760255813598633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,256,power_law_1.2,0.7781311988830566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,32,balanced,0.7476960023244222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,32,balanced,0.7481599648793539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,32,power_law_1.01,0.8812352180480957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,32,power_law_1.01,0.9133952140808106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,32,power_law_1.2,0.9649727821350098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,32,power_law_1.2,0.9934399604797364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,4,balanced,1.679690678914388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,4,balanced,1.6840640703837078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,4,power_law_1.01,2.176038360595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,4,power_law_1.01,2.1963903427124025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,4,power_law_1.2,2.2641536712646486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,4,power_law_1.2,2.3686592102050783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,64,balanced,0.6772747039794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,64,balanced,0.679365317026774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,64,power_law_1.01,0.8054207801818848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,64,power_law_1.01,0.811404800415039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,64,power_law_1.2,0.8899904251098633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,64,power_law_1.2,0.9034367561340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,8,balanced,1.135973294576009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,8,balanced,1.1393493016560872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,8,power_law_1.01,1.4429056167602539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,8,power_law_1.01,1.4748479843139648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,8,power_law_1.2,1.5720319747924805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,1,8,power_law_1.2,1.667673683166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,16,1,balanced,0.7534613609313965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,16,1,balanced,0.7546133200327555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,16,1,power_law_1.01,0.8994367599487305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,16,1,power_law_1.01,0.9319040298461914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,16,1,power_law_1.2,0.9466560363769532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,16,1,power_law_1.2,0.9631744384765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,2,1,balanced,2.6882025400797525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,2,1,balanced,2.8044745127360025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,2,1,power_law_1.01,3.429132843017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,2,1,power_law_1.01,3.530854415893555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,2,1,power_law_1.2,3.5767166137695314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,2,1,power_law_1.2,3.626764678955078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,32,1,balanced,0.625493327776591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,32,1,balanced,0.6256639957427979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,32,1,power_law_1.01,0.7660863876342774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,32,1,power_law_1.01,0.7661695957183838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,32,1,power_law_1.2,0.7776000022888183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,32,1,power_law_1.2,0.7783232212066651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,4,1,balanced,1.5413600603739421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,4,1,balanced,1.5453012784322102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,4,1,power_law_1.01,1.9349632263183594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,4,1,power_law_1.01,1.9383743286132813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,4,1,power_law_1.2,1.9776960372924806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,4,1,power_law_1.2,2.0029184341430666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,8,1,balanced,1.0132533709208171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,8,1,balanced,1.0142133235931396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,8,1,power_law_1.01,1.2391807556152343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,8,1,power_law_1.01,1.247539234161377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,8,1,power_law_1.2,1.3032959938049316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,256,8,1,power_law_1.2,1.3064959526062012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,1,balanced,7.315893173217773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,1,balanced,7.511781056722005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,1,power_law_1.01,8.365126037597657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,1,power_law_1.01,8.467244720458984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,1,power_law_1.2,8.796006774902343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,1,power_law_1.2,9.12613754272461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,128,balanced,0.7205333709716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,128,balanced,0.7219253381093343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,128,power_law_1.01,0.8053055763244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,128,power_law_1.01,0.8145536422729492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,128,power_law_1.2,0.8578368186950683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,128,power_law_1.2,0.8592960357666015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,16,balanced,1.0529812971750896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,16,balanced,1.0555946826934814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,16,power_law_1.01,1.1921024322509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,16,power_law_1.01,1.2020352363586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,16,power_law_1.2,1.2602944374084473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,16,power_law_1.2,1.321171188354492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,2,balanced,3.9656906127929688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,2,balanced,4.011381467183431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,2,power_law_1.01,4.352441787719727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,2,power_law_1.01,4.464755249023438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,2,power_law_1.2,4.804748916625977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,2,power_law_1.2,5.044160079956055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,32,balanced,0.869109312693278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,32,balanced,0.8712639808654785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,32,power_law_1.01,0.9912832260131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,32,power_law_1.01,0.9991488456726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,32,power_law_1.2,1.0286656379699708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,32,power_law_1.2,1.0289152145385743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,4,balanced,2.2001120249430337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,4,balanced,2.2161973317464194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,4,power_law_1.01,2.490233612060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,4,power_law_1.01,2.544236755371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,4,power_law_1.2,2.704640007019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,4,power_law_1.2,2.793164825439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,64,balanced,0.7649333477020264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,64,balanced,0.7677919864654541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,64,power_law_1.01,0.8617792129516602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,64,power_law_1.01,0.8646400451660157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,64,power_law_1.2,0.9187583923339844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,64,power_law_1.2,0.9226304054260254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,8,balanced,1.438912073771159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,8,balanced,1.4439627329508464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,8,power_law_1.01,1.6619840621948243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,8,power_law_1.01,1.7060991287231446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,8,power_law_1.2,1.7444927215576171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,1,8,power_law_1.2,1.8415231704711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,16,1,balanced,0.9636480013529459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,16,1,balanced,0.9637440045674642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,16,1,power_law_1.01,1.075692844390869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,16,1,power_law_1.01,1.0764415740966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,16,1,power_law_1.2,1.1015359878540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,16,1,power_law_1.2,1.102188777923584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,2,1,balanced,3.772698720296224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,2,1,balanced,3.8254931767781577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,2,1,power_law_1.01,4.254719924926758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,2,1,power_law_1.01,4.285804748535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,2,1,power_law_1.2,4.485087966918945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,2,1,power_law_1.2,4.540595245361328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,32,1,balanced,0.8049919605255127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,32,1,balanced,0.8081280390421549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,32,1,power_law_1.01,0.8601280212402344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,32,1,power_law_1.01,0.8671615600585938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,32,1,power_law_1.2,0.8786751747131347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,32,1,power_law_1.2,0.8863615989685059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,4,1,balanced,2.0765280723571777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,4,1,balanced,2.119210720062256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,4,1,power_law_1.01,2.334105682373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,4,1,power_law_1.01,2.3400896072387694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,4,1,power_law_1.2,2.4197824478149412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,4,1,power_law_1.2,2.475872039794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,8,1,balanced,1.3386613527933757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,8,1,balanced,1.3418879508972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,8,1,power_law_1.01,1.4885696411132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,8,1,power_law_1.01,1.5030847549438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,8,1,power_law_1.2,1.548908805847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,4096,7168,2048,8,384,8,1,power_law_1.2,1.561619186401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,1,balanced,0.206986665725708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,1,balanced,0.2081813414891561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,1,power_law_1.01,0.18387839794158936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,1,power_law_1.01,0.1861631989479065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,1,power_law_1.2,0.1855039954185486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,1,power_law_1.2,0.18766720294952394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,128,balanced,0.033488000432650246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,128,balanced,0.03359466542800268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,128,power_law_1.01,0.03210879862308502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,128,power_law_1.01,0.033395200967788696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,128,power_law_1.2,0.03237119913101196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,128,power_law_1.2,0.03281280100345611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,16,balanced,0.041536000867684685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,16,balanced,0.04180799921353658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,16,power_law_1.01,0.040838399529457094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,16,power_law_1.01,0.04110719859600067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,16,power_law_1.2,0.04020479917526245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,16,power_law_1.2,0.040345600247383116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,2,balanced,0.13770133256912231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,2,balanced,0.14827733238538107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,2,power_law_1.01,0.12628480195999145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,2,power_law_1.01,0.12747520208358765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,2,power_law_1.2,0.1273151993751526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,2,power_law_1.2,0.12827520370483397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,32,balanced,0.03572266548871994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,32,balanced,0.03751999884843826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,32,power_law_1.01,0.0347135990858078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,32,power_law_1.01,0.034764799475669864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,32,power_law_1.2,0.03503359854221344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,32,power_law_1.2,0.03624320030212402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,4,balanced,0.08922666311264038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,4,balanced,0.09013866384824117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,4,power_law_1.01,0.08359040021896362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,4,power_law_1.01,0.08485119938850402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,4,power_law_1.2,0.08113279938697815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,4,power_law_1.2,0.08243839740753174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,64,balanced,0.035216001172860466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,64,balanced,0.035546667873859406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,64,power_law_1.01,0.03266560137271881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,64,power_law_1.01,0.032767999172210696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,64,power_law_1.2,0.032979199290275575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,64,power_law_1.2,0.03318400084972382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,8,balanced,0.05856533348560333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,8,balanced,0.059546664357185364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,8,power_law_1.01,0.05368319749832153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,8,power_law_1.01,0.05511040091514587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,8,power_law_1.2,0.055180799961090085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,1,8,power_law_1.2,0.05541120171546936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,2,1,balanced,0.14010666807492575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,2,1,balanced,0.1402666668097178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,2,1,power_law_1.01,0.12665599584579468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,2,1,power_law_1.01,0.13148159980773927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,2,1,power_law_1.2,0.1277567982673645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,2,1,power_law_1.2,0.12949759960174562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,4,1,balanced,0.09967466195424397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,4,1,balanced,0.10126399993896484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,4,1,power_law_1.01,0.09064319729804993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,4,1,power_law_1.01,0.09114239811897278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,4,1,power_law_1.2,0.09091200232505799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2048,768,8,128,4,1,power_law_1.2,0.09198079705238342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,1,balanced,0.5775839885075887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,1,balanced,0.5814400116602579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,1,power_law_1.01,0.4839615821838379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,1,power_law_1.01,0.49049601554870603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,1,power_law_1.2,0.47049598693847655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,1,power_law_1.2,0.48731517791748047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,128,balanced,0.04154666761557261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,128,balanced,0.041706666350364685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,128,power_law_1.01,0.039904001355171206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,128,power_law_1.01,0.04002560079097748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,128,power_law_1.2,0.040268799662590025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,128,power_law_1.2,0.04062080085277557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,16,balanced,0.07281599938869476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,16,balanced,0.07323200007279713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,16,power_law_1.01,0.0697920024394989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,16,power_law_1.01,0.06998400092124939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,16,power_law_1.2,0.06937599778175355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,16,power_law_1.2,0.07041919827461243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,2,balanced,0.3373386859893799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,2,balanced,0.3398666779200236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,2,power_law_1.01,0.2834496021270752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,2,power_law_1.01,0.2936896085739136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,2,power_law_1.2,0.2700608015060425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,2,power_law_1.2,0.2919424057006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,32,balanced,0.05724266668160757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,32,balanced,0.05819733440876007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,32,power_law_1.01,0.054745602607727054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,32,power_law_1.01,0.05570560097694397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,32,power_law_1.2,0.054681599140167236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,32,power_law_1.2,0.05608320236206055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,4,balanced,0.19754133621851602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,4,balanced,0.20081599553426108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,4,power_law_1.01,0.16079360246658325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,4,power_law_1.01,0.17436800003051758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,4,power_law_1.2,0.1572864055633545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,4,power_law_1.2,0.16430720090866088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,64,balanced,0.04609066744645437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,64,balanced,0.0461706668138504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,64,power_law_1.01,0.04511359930038452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,64,power_law_1.01,0.04521600008010864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,64,power_law_1.2,0.04442879855632782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,64,power_law_1.2,0.04477440118789673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,8,balanced,0.1225226620833079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,8,balanced,0.12425067027409871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,8,power_law_1.01,0.11208959817886352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,8,power_law_1.01,0.11244800090789794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,8,power_law_1.2,0.10680320262908935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,1,8,power_law_1.2,0.11436159610748291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,16,1,balanced,0.23836266994476318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,16,1,balanced,0.23836799462636313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,16,1,power_law_1.01,0.19242240190505983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,16,1,power_law_1.01,0.19512319564819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,16,1,power_law_1.2,0.1974400043487549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,16,1,power_law_1.2,0.2026304006576538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,2,1,balanced,0.34487466017405194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,2,1,balanced,0.3468960126241048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,2,1,power_law_1.01,0.2880064010620117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,2,1,power_law_1.01,0.2886399984359741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,2,1,power_law_1.2,0.28373119831085203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,2,1,power_law_1.2,0.2905407905578613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,32,1,balanced,0.2232266664505005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,32,1,balanced,0.2236479918162028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,32,1,power_law_1.01,0.18036479949951173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,32,1,power_law_1.01,0.18662400245666505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,32,1,power_law_1.2,0.18256640434265137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,32,1,power_law_1.2,0.18273919820785522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,4,1,balanced,0.20798399051030478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,4,1,balanced,0.20879999796549478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,4,1,power_law_1.01,0.17079039812088012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,4,1,power_law_1.01,0.1715775966644287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,4,1,power_law_1.2,0.1729151964187622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,4,1,power_law_1.2,0.1730687975883484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,8,1,balanced,0.307696004708608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,8,1,balanced,0.30884265899658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,8,1,power_law_1.01,0.2603775978088379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,8,1,power_law_1.01,0.2616703987121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,8,1,power_law_1.2,0.25401599407196046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,2688,1856,6,128,8,1,power_law_1.2,0.25836160182952883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,1,balanced,1.094048023223877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,1,balanced,1.0972426732381184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,1,power_law_1.01,0.7965119838714599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,1,power_law_1.01,0.8038911819458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,1,power_law_1.2,0.7764863967895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,1,power_law_1.2,0.7889344215393066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,128,balanced,0.045754666129748024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,128,balanced,0.046581332882245384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,128,power_law_1.01,0.04447999894618988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,128,power_law_1.01,0.04499199986457825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,128,power_law_1.2,0.04469119906425476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,128,power_law_1.2,0.04506239891052246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,16,balanced,0.12034666538238525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,16,balanced,0.12081600228945415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,16,power_law_1.01,0.10191359519958496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,16,power_law_1.01,0.10823040008544922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,16,power_law_1.2,0.1017151951789856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,16,power_law_1.2,0.10362880229949951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,2,balanced,0.578437328338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,2,balanced,0.5806080102920532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,2,power_law_1.01,0.43283839225769044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,2,power_law_1.01,0.45070719718933105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,2,power_law_1.2,0.42665600776672363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,2,power_law_1.2,0.4507775783538818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,256,balanced,0.04357333481311798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,256,balanced,0.04390933116277059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,256,power_law_1.01,0.042828801274299624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,256,power_law_1.01,0.04302079975605011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,256,power_law_1.2,0.04325760006904602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,256,power_law_1.2,0.04332799911499023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,32,balanced,0.07467199862003326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,32,balanced,0.07684266567230225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,32,power_law_1.01,0.06964480280876159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,32,power_law_1.01,0.07048959732055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,32,power_law_1.2,0.06771199703216553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,32,power_law_1.2,0.06903679966926575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,4,balanced,0.3169599970181783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,4,balanced,0.3298186659812927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,4,power_law_1.01,0.22748799324035646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,4,power_law_1.01,0.25423359870910645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,4,power_law_1.2,0.2654207944869995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,4,power_law_1.2,0.2699199914932251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,64,balanced,0.057717333237330117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,64,balanced,0.0588319996992747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,64,power_law_1.01,0.05572479963302612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,64,power_law_1.01,0.05591679811477661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,64,power_law_1.2,0.05533440113067627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,64,power_law_1.2,0.056704002618789676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,8,balanced,0.18275733788808188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,8,balanced,0.1844693422317505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,8,power_law_1.01,0.1417088031768799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,8,power_law_1.01,0.15155199766159058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,8,power_law_1.2,0.159660804271698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,1,8,power_law_1.2,0.16246399879455567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,16,1,balanced,0.1644480029741923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,16,1,balanced,0.16643200318018594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,16,1,power_law_1.01,0.11695359945297241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,16,1,power_law_1.01,0.11742719411849975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,16,1,power_law_1.2,0.1137727975845337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,16,1,power_law_1.2,0.11628160476684571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,2,1,balanced,0.5859786669413248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,2,1,balanced,0.5991093317667643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,2,1,power_law_1.01,0.4324607849121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,2,1,power_law_1.01,0.43571839332580564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,2,1,power_law_1.2,0.42322559356689454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,2,1,power_law_1.2,0.4301439762115479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,32,1,balanced,0.13436800241470337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,32,1,balanced,0.13573333621025085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,32,1,power_law_1.01,0.10609920024871826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,32,1,power_law_1.01,0.10618879795074462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,32,1,power_law_1.2,0.10426239967346192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,32,1,power_law_1.2,0.10460159778594971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,4,1,balanced,0.3397279977798462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,4,1,balanced,0.3397333224614461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,4,1,power_law_1.01,0.2523008108139038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,4,1,power_law_1.01,0.2525439977645874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,4,1,power_law_1.2,0.2506047964096069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,4,1,power_law_1.2,0.2508352041244507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,8,1,balanced,0.22420267264048258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,8,1,balanced,0.22449066241582236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,8,1,power_law_1.01,0.1650239944458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,8,1,power_law_1.01,0.16727039813995362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,8,1,power_law_1.2,0.16060160398483275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,3072,1536,8,256,8,1,power_law_1.2,0.162336003780365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,1,balanced,0.46299731731414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,1,balanced,0.46459734439849854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,1,power_law_1.01,0.45425920486450194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,1,power_law_1.01,0.46524801254272463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,1,power_law_1.2,0.4677696228027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,1,power_law_1.2,0.46808319091796874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,2,balanced,0.28462400039037067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,2,balanced,0.2863679925600688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,2,power_law_1.01,0.297708797454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,2,power_law_1.01,0.29950718879699706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,2,power_law_1.2,0.2973952054977417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,2,power_law_1.2,0.29881598949432375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,4,balanced,0.18986133734385172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,4,balanced,0.2004106640815735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,4,power_law_1.01,0.19596799612045288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,4,power_law_1.01,0.20924160480499268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,4,power_law_1.2,0.18863359689712525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,4,power_law_1.2,0.21047680377960204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,8,balanced,0.13481066624323526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,8,balanced,0.13552000125249228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,8,power_law_1.01,0.14369920492172242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,8,power_law_1.01,0.15239039659500123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,8,power_law_1.2,0.14190080165863037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,1,8,power_law_1.2,0.15321600437164307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,16,1,balanced,0.05820799867312113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,16,1,balanced,0.06006933252016703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,16,1,power_law_1.01,0.057017600536346434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,16,1,power_law_1.01,0.05751680135726929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,16,1,power_law_1.2,0.05639680027961731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,16,1,power_law_1.2,0.056883198022842404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,2,1,balanced,0.2532479961713155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,2,1,balanced,0.2537600000699361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,2,1,power_law_1.01,0.24821119308471679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,2,1,power_law_1.01,0.25728640556335447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,2,1,power_law_1.2,0.25106561183929443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,2,1,power_law_1.2,0.2589184045791626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,32,1,balanced,0.04171200096607208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,32,1,balanced,0.04553066690762838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,32,1,power_law_1.01,0.041280001401901245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,32,1,power_law_1.01,0.04223999977111816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,32,1,power_law_1.2,0.04200960099697113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,32,1,power_law_1.2,0.04343039989471435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,4,1,balanced,0.1463093360265096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,4,1,balanced,0.15547200043996176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,4,1,power_law_1.01,0.1401919960975647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,4,1,power_law_1.01,0.14298239946365357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,4,1,power_law_1.2,0.145305597782135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,4,1,power_law_1.2,0.1453760027885437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,8,1,balanced,0.09527466694513957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,8,1,balanced,0.09692266583442688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,8,1,power_law_1.01,0.08049280047416688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,8,1,power_law_1.01,0.08272640109062195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,8,1,power_law_1.2,0.08163840174674988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,14336,2,8,8,1,power_law_1.2,0.08247039914131164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,1,balanced,0.7592960198720297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,1,balanced,0.7662453651428223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,1,power_law_1.01,0.6669375896453857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,1,power_law_1.01,0.6677248001098632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,1,power_law_1.2,0.6746560096740722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,1,power_law_1.2,0.6774144172668457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,128,balanced,0.04558933277924856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,128,balanced,0.04586133360862732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,128,power_law_1.01,0.045049598813056944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,128,power_law_1.01,0.04535680115222931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,128,power_law_1.2,0.04470399916172028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,128,power_law_1.2,0.0451200008392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,16,balanced,0.08879466851552327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,16,balanced,0.08892266949017842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,16,power_law_1.01,0.08112639784812928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,16,power_law_1.01,0.08399999737739564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,16,power_law_1.2,0.08261119723320007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,16,power_law_1.2,0.08315520286560059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,2,balanced,0.41283198197682697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,2,balanced,0.414192001024882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,2,power_law_1.01,0.35820159912109373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,2,power_law_1.01,0.36479361057281495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,2,power_law_1.2,0.3734591960906982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,2,power_law_1.2,0.3743808031082153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,32,balanced,0.06621333460013072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,32,balanced,0.067071999112765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,32,power_law_1.01,0.06451200246810913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,32,power_law_1.01,0.06479359865188598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,32,power_law_1.2,0.06377599835395813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,32,power_law_1.2,0.06552960276603699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,4,balanced,0.23226666450500488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,4,balanced,0.23422932624816895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,4,power_law_1.01,0.21624319553375243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,4,power_law_1.01,0.21953279972076417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,4,power_law_1.2,0.2182784080505371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,4,power_law_1.2,0.21953918933868408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,64,balanced,0.04986133178075155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,64,balanced,0.052890668312708534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,64,power_law_1.01,0.0490880012512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,64,power_law_1.01,0.049497601389884946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,64,power_law_1.2,0.0495743989944458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,64,power_law_1.2,0.05177599787712097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,8,balanced,0.14814399679501852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,8,power_law_1.01,0.139628803730011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,8,power_law_1.01,0.14136960506439208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,8,power_law_1.2,0.14153599739074707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,1,8,power_law_1.2,0.14209920167922974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,16,1,balanced,0.11473066608111064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,16,1,balanced,0.11559999982515971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,16,1,power_law_1.01,0.10314240455627441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,16,1,power_law_1.01,0.10477440357208252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,16,1,power_law_1.2,0.10392320156097412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,16,1,power_law_1.2,0.10606720447540283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,2,1,balanced,0.3835306564966838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,2,1,balanced,0.3887253204981486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,2,1,power_law_1.01,0.3392767906188965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,2,1,power_law_1.01,0.3402496099472046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,2,1,power_law_1.2,0.341644811630249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,2,1,power_law_1.2,0.3426815986633301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,32,1,balanced,0.10283199946085612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,32,1,balanced,0.10319999853769939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,32,1,power_law_1.01,0.09411200284957885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,32,1,power_law_1.01,0.09574400186538697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,32,1,power_law_1.2,0.09435520172119141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,32,1,power_law_1.2,0.09493759870529175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,4,1,balanced,0.24418665965398154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,4,1,balanced,0.2456000049908956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,4,1,power_law_1.01,0.22358400821685792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,4,1,power_law_1.01,0.22736001014709473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,4,1,power_law_1.2,0.22722558975219725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,4,1,power_law_1.2,0.22951679229736327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,8,1,balanced,0.17293334007263184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,8,1,balanced,0.17620799938837686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,8,1,power_law_1.01,0.15203839540481567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,8,1,power_law_1.01,0.15781760215759277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,8,1,power_law_1.2,0.15812480449676514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,1536,8,128,8,1,power_law_1.2,0.1619328022003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,1,balanced,4.999557177225749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,1,balanced,4.999850591023763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,1,power_law_1.01,3.896889495849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,1,power_law_1.01,3.949625778198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,1,power_law_1.2,3.899814224243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,1,power_law_1.2,3.9953407287597655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,128,balanced,0.11739200353622437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,128,balanced,0.11752532919247945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,128,power_law_1.01,0.11438720226287842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,128,power_law_1.01,0.11543680429458618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,128,power_law_1.2,0.1125823974609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,128,power_law_1.2,0.11310720443725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,16,balanced,0.3933546543121338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,16,balanced,0.3940906524658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,16,power_law_1.01,0.33834879398345946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,16,power_law_1.01,0.343667197227478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,16,power_law_1.2,0.3301759958267212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,16,power_law_1.2,0.33223040103912355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,2,balanced,2.5022452672322593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,2,balanced,2.5851786931355796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,2,power_law_1.01,2.098611259460449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,2,power_law_1.01,2.136000061035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,2,power_law_1.2,2.0809024810791015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,2,power_law_1.2,2.082854461669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,256,balanced,0.09687999884287517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,256,balanced,0.09723732868830363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,256,power_law_1.01,0.0960640013217926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,256,power_law_1.01,0.09646080136299133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,256,power_law_1.2,0.09635840058326721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,256,power_law_1.2,0.09659519791603088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,32,balanced,0.24261866013209024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,32,balanced,0.24269866943359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,32,power_law_1.01,0.21084799766540527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,32,power_law_1.01,0.22079360485076904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,32,power_law_1.2,0.2153088092803955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,32,power_law_1.2,0.22773120403289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,4,balanced,1.302026669184367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,4,balanced,1.3028159936269124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,4,power_law_1.01,1.1259967803955078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,4,power_law_1.01,1.1366592407226563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,4,power_law_1.2,1.0518783569335937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,4,power_law_1.2,1.1823360443115234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,64,balanced,0.16665599743525186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,64,balanced,0.1689173380533854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,64,power_law_1.01,0.1579327940940857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,64,power_law_1.01,0.15955840349197387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,64,power_law_1.2,0.15860480070114136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,64,power_law_1.2,0.1587839961051941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,8,balanced,0.7015360196431478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,8,balanced,0.7017386754353842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,8,power_law_1.01,0.6222527980804443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,8,power_law_1.01,0.6234176158905029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,8,power_law_1.2,0.5516799926757813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,1,8,power_law_1.2,0.6026303768157959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,16,1,balanced,1.570101261138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,16,1,balanced,1.5749972661336262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,16,1,power_law_1.01,1.2483776092529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,16,1,power_law_1.01,1.257817554473877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,16,1,power_law_1.2,1.2415743827819825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,16,1,power_law_1.2,1.2651328086853026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,2,1,balanced,2.4123573303222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,2,1,balanced,2.4192585945129395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,2,1,power_law_1.01,1.8845504760742187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,2,1,power_law_1.01,1.9240127563476563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,2,1,power_law_1.2,1.8891008377075196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,2,1,power_law_1.2,1.9054719924926757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,32,1,balanced,1.2661759853363037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,32,1,balanced,1.2669440110524495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,32,1,power_law_1.01,1.0242239952087402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,32,1,power_law_1.01,1.0259712219238282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,32,1,power_law_1.2,1.0163007736206056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,32,1,power_law_1.2,1.0246527671813965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,4,1,balanced,1.428709348042806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,4,1,balanced,1.4310933748881023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,4,1,power_law_1.01,1.1552255630493165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,4,1,power_law_1.01,1.1621503829956055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,4,1,power_law_1.2,1.1261247634887694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,4,1,power_law_1.2,1.146617603302002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,8,1,balanced,0.7987519900004069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,8,1,balanced,0.7996640205383301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,8,1,power_law_1.01,0.6447679996490479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,8,1,power_law_1.01,0.6447936058044433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,8,1,power_law_1.2,0.6430399894714356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,4096,2688,22,512,8,1,power_law_1.2,0.6488192081451416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,1,balanced,0.7834239800771078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,1,balanced,0.7908533414204916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,1,power_law_1.01,0.8342911720275878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,1,power_law_1.01,0.8431232452392579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,1,power_law_1.2,0.8376832008361816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,1,power_law_1.2,0.8395071983337402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,2,balanced,0.4388959805170695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,2,balanced,0.4585973421732585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,2,power_law_1.01,0.4569087982177734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,2,power_law_1.01,0.4634880065917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,2,power_law_1.2,0.4544960021972656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,2,power_law_1.2,0.4643263816833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,4,balanced,0.24808533986409506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,4,balanced,0.24914666016896567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,4,power_law_1.01,0.27852160930633546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,4,power_law_1.01,0.31008639335632326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,4,power_law_1.2,0.26537599563598635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,4,power_law_1.2,0.2836735963821411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,8,balanced,0.16792533795038858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,8,balanced,0.17081065972646078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,8,power_law_1.01,0.18195199966430664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,8,power_law_1.01,0.19420160055160524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,8,power_law_1.2,0.19567999839782715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,1,8,power_law_1.2,0.19646719694137574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,16,1,balanced,0.08284799754619598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,16,1,balanced,0.08308800061543782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,16,1,power_law_1.01,0.08428159952163697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,16,1,power_law_1.01,0.08598399758338929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,16,1,power_law_1.2,0.0863103985786438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,16,1,power_law_1.2,0.08698880076408386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,2,1,balanced,0.43483734130859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,2,1,balanced,0.46776000658671063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,2,1,power_law_1.01,0.42808961868286133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,2,1,power_law_1.01,0.43303680419921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,2,1,power_law_1.2,0.42739200592041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,2,1,power_law_1.2,0.4285952091217041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,32,1,balanced,0.06591466565926869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,32,1,balanced,0.06621333460013072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,32,1,power_law_1.01,0.06380159854888916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,32,1,power_law_1.01,0.06408320069313049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,32,1,power_law_1.2,0.06292480230331421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,32,1,power_law_1.2,0.0636672019958496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,4,1,balanced,0.23265065749486288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,4,1,balanced,0.2508053382237752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,4,1,power_law_1.01,0.22956159114837646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,4,1,power_law_1.01,0.23136000633239745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,4,1,power_law_1.2,0.23143680095672609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,4,1,power_law_1.2,0.23186559677124025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,8,1,balanced,0.1280693312486013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,8,1,balanced,0.1414400041103363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,8,1,power_law_1.01,0.12573440074920655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,8,1,power_law_1.01,0.12603520154953002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,8,1,power_law_1.2,0.12811520099639892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,16384,2,8,8,1,power_law_1.2,0.13121919631958007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,1,balanced,2.7917493184407554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,1,balanced,2.8759520848592124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,1,power_law_1.01,1.9925952911376954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,1,power_law_1.01,2.0143808364868163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,1,power_law_1.2,2.0001087188720703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,1,power_law_1.2,2.0120895385742186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,128,balanced,0.08449066678682964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,128,balanced,0.08463999629020691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,128,power_law_1.01,0.0832319974899292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,128,power_law_1.01,0.08415359854698182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,128,power_law_1.2,0.08344320058822632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,128,power_law_1.2,0.08366720080375671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,16,balanced,0.23111999034881592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,16,balanced,0.2325013279914856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,16,power_law_1.01,0.21231999397277831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,16,power_law_1.01,0.2204927921295166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,16,power_law_1.2,0.2102976083755493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,16,power_law_1.2,0.2239232063293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,2,balanced,1.4287999471028645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,2,balanced,1.4291680653889973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,2,power_law_1.01,1.0984448432922362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,2,power_law_1.01,1.1663552284240724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,2,power_law_1.2,0.9990655899047851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,2,power_law_1.2,1.0579903602600098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,256,balanced,0.06866133213043213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,256,balanced,0.06942933301130931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,256,power_law_1.01,0.06733440160751343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,256,power_law_1.01,0.06996480226516724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,256,power_law_1.2,0.06691840291023254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,256,power_law_1.2,0.06747519969940186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,32,balanced,0.1395199994246165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,32,balanced,0.13987200458844504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,32,power_law_1.01,0.1299839973449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,32,power_law_1.01,0.13026560544967652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,32,power_law_1.2,0.12618240118026733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,32,power_law_1.2,0.13226239681243895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,4,balanced,0.7441386381785074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,4,balanced,0.7444427013397217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,4,power_law_1.01,0.5973055839538575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,4,power_law_1.01,0.6355072021484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,4,power_law_1.2,0.5978496074676514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,4,power_law_1.2,0.6043712139129639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,64,balanced,0.1034346620241801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,64,balanced,0.10534399747848511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,64,power_law_1.01,0.09902080297470092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,64,power_law_1.01,0.09996799826622009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,64,power_law_1.2,0.09317759871482849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,64,power_law_1.2,0.10214400291442871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,8,balanced,0.4203946590423584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,8,balanced,0.4222613175710042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,8,power_law_1.01,0.34609920978546144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,8,power_law_1.01,0.3968832015991211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,8,power_law_1.2,0.339737606048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,1,8,power_law_1.2,0.38224000930786134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,16,1,balanced,0.30900800228118896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,16,1,balanced,0.30990399916966754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,16,1,power_law_1.01,0.2555583953857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,16,1,power_law_1.01,0.2605504035949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,16,1,power_law_1.2,0.24865279197692872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,16,1,power_law_1.2,0.2548095941543579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,2,1,balanced,1.4530933698018391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,2,1,balanced,1.4593493143717449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,2,1,power_law_1.01,1.0613696098327636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,2,1,power_law_1.01,1.087782382965088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,2,1,power_law_1.2,1.0304448127746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,2,1,power_law_1.2,1.0448575973510743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,32,1,balanced,0.2444159984588623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,32,1,balanced,0.24474666515986124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,32,1,power_law_1.01,0.1883903980255127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,32,1,power_law_1.01,0.191046404838562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,32,1,power_law_1.2,0.18429440259933472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,32,1,power_law_1.2,0.1845952033996582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,4,1,balanced,0.7771360079447428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,4,1,balanced,0.7773173650105795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,4,1,power_law_1.01,0.5662720203399658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,4,1,power_law_1.01,0.5817599773406983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,4,1,power_law_1.2,0.551206398010254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,4,1,power_law_1.2,0.5647168159484863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,8,1,balanced,0.48023998737335205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,8,1,balanced,0.4814666509628296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,8,1,power_law_1.01,0.35437440872192383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,8,1,power_law_1.01,0.36362879276275634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,8,1,power_law_1.2,0.3546560049057007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2048,8,256,8,1,power_law_1.2,0.3618495941162109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,1,balanced,2.2023092905680337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,1,balanced,2.2031733194986978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,1,power_law_1.01,1.8182655334472657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,1,power_law_1.01,1.829644775390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,1,power_law_1.2,1.8186304092407226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,1,power_law_1.2,1.8695552825927735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,16,balanced,0.20419732729593912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,16,balanced,0.2092319925626119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,16,power_law_1.01,0.1797824025154114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,16,power_law_1.01,0.1889407992362976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,16,power_law_1.2,0.1871616005897522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,16,power_law_1.2,0.19063040018081664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,2,balanced,1.1287840207417805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,2,balanced,1.1288106441497803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,2,power_law_1.01,0.9564224243164062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,2,power_law_1.01,0.9834688186645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,2,power_law_1.2,0.951699161529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,2,power_law_1.2,0.9749504089355469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,32,balanced,0.11914666493733723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,32,balanced,0.1204746663570404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,32,power_law_1.01,0.11544959545135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,32,power_law_1.01,0.1186560034751892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,32,power_law_1.2,0.1124608039855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,32,power_law_1.2,0.11560959815979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,4,balanced,0.6118293205897013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,4,balanced,0.6132373412450155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,4,power_law_1.01,0.5228735923767089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,4,power_law_1.01,0.5589568138122558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,4,power_law_1.2,0.5056960105895996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,4,power_law_1.2,0.5396607875823974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,8,balanced,0.327455997467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,8,balanced,0.32945066690444946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,8,power_law_1.01,0.305132794380188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,8,power_law_1.01,0.3109312057495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,8,power_law_1.2,0.29921278953552244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,1,8,power_law_1.2,0.317523193359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,16,1,balanced,0.27501867214838666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,16,1,balanced,0.2792373299598694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,16,1,power_law_1.01,0.23055360317230225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,16,1,power_law_1.01,0.23070080280303956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,16,1,power_law_1.2,0.23390719890594483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,16,1,power_law_1.2,0.24075520038604736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,2,1,balanced,1.1285226345062256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,2,1,balanced,1.1307573318481445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,2,1,power_law_1.01,0.9377728462219238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,2,1,power_law_1.01,0.9442560195922851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,2,1,power_law_1.2,0.9443903923034668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,2,1,power_law_1.2,0.9483584403991699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,32,1,balanced,0.18340800205866495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,32,1,balanced,0.18475200732549033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,32,1,power_law_1.01,0.15593600273132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,32,1,power_law_1.01,0.15849599838256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,32,1,power_law_1.2,0.15550719499588012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,32,1,power_law_1.2,0.15555200576782227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,4,1,balanced,0.631114681561788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,4,1,balanced,0.6440693140029907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,4,1,power_law_1.01,0.5207808017730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,4,1,power_law_1.01,0.5237887859344482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,4,1,power_law_1.2,0.5184832096099854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,4,1,power_law_1.2,0.5259903907775879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,8,1,balanced,0.3739039897918701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,8,1,balanced,0.3744000196456909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,8,1,power_law_1.01,0.3258368015289307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,8,1,power_law_1.01,0.32683520317077636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,8,1,power_law_1.2,0.3259007930755615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,6144,2560,8,160,8,1,power_law_1.2,0.3268224000930786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,1,balanced,3.254026730855306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,1,balanced,3.255242665608724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,1,power_law_1.01,2.3467967987060545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,1,power_law_1.01,2.3602495193481445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,1,power_law_1.2,2.375833511352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,1,power_law_1.2,2.3775808334350588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,128,balanced,0.09541333715120952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,128,balanced,0.0960586667060852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,128,power_law_1.01,0.09377279877662659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,128,power_law_1.01,0.0939136028289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,128,power_law_1.2,0.09334400296211243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,128,power_law_1.2,0.09388800263404846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,16,balanced,0.2678239941596985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,16,balanced,0.27297600110371906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,16,power_law_1.01,0.24661760330200194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,16,power_law_1.01,0.2473088026046753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,16,power_law_1.2,0.2363136053085327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,16,power_law_1.2,0.24949119091033936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,2,balanced,1.6550827026367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,2,balanced,1.667151927947998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,2,power_law_1.01,1.2878656387329102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,2,power_law_1.01,1.2894975662231445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,2,power_law_1.2,1.2229951858520507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,2,power_law_1.2,1.237945556640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,256,balanced,0.0804799993832906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,256,balanced,0.08257600168387096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,256,power_law_1.01,0.07975680232048035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,256,power_law_1.01,0.08027520179748535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,256,power_law_1.2,0.07858560085296631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,256,power_law_1.2,0.07992320060729981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,32,balanced,0.15683199961980185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,32,balanced,0.1578986644744873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,32,power_law_1.01,0.1494976043701172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,32,power_law_1.01,0.150655996799469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,32,power_law_1.2,0.14696320295333862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,32,power_law_1.2,0.15148160457611085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,4,balanced,0.8606773217519125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,4,balanced,0.8630186716715494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,4,power_law_1.01,0.7523583889007568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,4,power_law_1.01,0.7712319850921631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,4,power_law_1.2,0.7463808059692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,4,power_law_1.2,0.7897984027862549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,64,balanced,0.11761599779129028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,64,balanced,0.11930666367212932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,64,power_law_1.01,0.11550079584121704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,64,power_law_1.01,0.11681920289993286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,64,power_law_1.2,0.10945279598236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,64,power_law_1.2,0.11274240016937256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,8,balanced,0.48603200912475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,8,balanced,0.4987786610921224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,8,power_law_1.01,0.42342400550842285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,8,power_law_1.01,0.45180158615112304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,8,power_law_1.2,0.42378878593444824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,1,8,power_law_1.2,0.447219181060791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,16,1,balanced,0.3561600049336751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,16,1,balanced,0.3568426767985026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,16,1,power_law_1.01,0.2887295961380005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,16,1,power_law_1.01,0.2932800054550171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,16,1,power_law_1.2,0.2884160041809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,16,1,power_law_1.2,0.2900736093521118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,2,1,balanced,1.6907413800557454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,2,1,balanced,1.7267573674519856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,2,1,power_law_1.01,1.2412544250488282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,2,1,power_law_1.01,1.25600004196167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,2,1,power_law_1.2,1.2027071952819823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,2,1,power_law_1.2,1.2232704162597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,32,1,balanced,0.2799359957377116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,32,1,balanced,0.28012265761693317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,32,1,power_law_1.01,0.21389439105987548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,32,1,power_law_1.01,0.21692800521850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,32,1,power_law_1.2,0.2136320114135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,32,1,power_law_1.2,0.2149951934814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,4,1,balanced,0.9013226826985677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,4,1,balanced,0.9365812937418619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,4,1,power_law_1.01,0.6527040004730225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,4,1,power_law_1.01,0.6708864212036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,4,1,power_law_1.2,0.6486527919769287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,4,1,power_law_1.2,0.6594816207885742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,8,1,balanced,0.5572906732559204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,8,1,balanced,0.5579306681950887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,8,1,power_law_1.01,0.4185344219207764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,8,1,power_law_1.01,0.4197120189666748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,8,1,power_law_1.2,0.40712318420410154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,256,8,1,power_law_1.2,0.41619200706481935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,1,balanced,5.095882733662923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,1,balanced,5.115488052368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,1,power_law_1.01,2.445523262023926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,1,power_law_1.01,2.534566307067871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,1,power_law_1.2,2.2453311920166015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,1,power_law_1.2,2.2938880920410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,128,balanced,0.11059733231862386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,128,balanced,0.11124799648920695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,128,power_law_1.01,0.10648959875106812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,128,power_law_1.01,0.10851839780807496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,128,power_law_1.2,0.10536960363388062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,128,power_law_1.2,0.10647039413452149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,16,balanced,0.383786678314209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,16,balanced,0.3840959866841634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,16,power_law_1.01,0.3153408050537109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,16,power_law_1.01,0.34064640998840334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,16,power_law_1.2,0.3043839931488037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,16,power_law_1.2,0.31687679290771487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,2,balanced,2.477519989013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,2,balanced,2.511610666910807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,2,power_law_1.01,1.410591983795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,2,power_law_1.01,1.4502911567687988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,2,power_law_1.2,1.3713855743408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,2,power_law_1.2,1.4076416015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,32,balanced,0.2445546587308248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,32,balanced,0.24700266122817993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,32,power_law_1.01,0.19464319944381714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,32,power_law_1.01,0.22231678962707518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,32,power_law_1.2,0.21063680648803712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,32,power_law_1.2,0.22758400440216064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,4,balanced,1.2834400335947673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,4,balanced,1.2851093610127766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,4,power_law_1.01,0.8502592086791992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,4,power_law_1.01,0.8664128303527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,4,power_law_1.2,0.7168255805969238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,4,power_law_1.2,0.7878848075866699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,64,balanced,0.1536799967288971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,64,balanced,0.15439466635386148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,64,power_law_1.01,0.12966400384902954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,64,power_law_1.01,0.13277440071105956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,64,power_law_1.2,0.12540160417556762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,64,power_law_1.2,0.13482240438461304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,8,balanced,0.6928799947102865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,8,balanced,0.696773370107015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,8,power_law_1.01,0.5640128135681153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,8,power_law_1.01,0.5898047924041748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,8,power_law_1.2,0.5559552192687989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,1,8,power_law_1.2,0.6630655765533447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,16,1,balanced,0.5235840082168579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,16,1,balanced,0.5418399969736735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,16,1,power_law_1.01,0.30882558822631834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,16,1,power_law_1.01,0.31795198917388917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,16,1,power_law_1.2,0.2893183946609497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,16,1,power_law_1.2,0.2912447929382324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,2,1,balanced,2.515157381693522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,2,1,balanced,2.5258453687032065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,2,1,power_law_1.01,1.3097920417785645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,2,1,power_law_1.01,1.331833553314209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,2,1,power_law_1.2,1.1927103996276855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,2,1,power_law_1.2,1.2011839866638183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,32,1,balanced,0.43427733580271405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,32,1,balanced,0.437552014986674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,32,1,power_law_1.01,0.2413696050643921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,32,1,power_law_1.01,0.2450176000595093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,32,1,power_law_1.2,0.2182080030441284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,32,1,power_law_1.2,0.21865599155426024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,4,1,balanced,1.344154675801595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,4,1,balanced,1.364192008972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,4,1,power_law_1.01,0.7067967891693115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,4,1,power_law_1.01,0.7171648025512696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,4,1,power_law_1.2,0.648524808883667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,4,1,power_law_1.2,0.6590976238250732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,8,1,balanced,0.8046293258666992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,8,1,balanced,0.8077759742736816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,8,1,power_law_1.01,0.43457918167114257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,8,1,power_law_1.01,0.44035840034484863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,8,1,power_law_1.2,0.4147007942199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,48,7168,2048,8,384,8,1,power_law_1.2,0.41860480308532716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,1,balanced,0.24415467182795206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,1,balanced,0.24463999271392822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,1,power_law_1.01,0.2551039934158325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,1,power_law_1.01,0.25628159046173093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,1,power_law_1.2,0.25608320236206056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,1,power_law_1.2,0.25728640556335447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,128,balanced,0.06282133360703786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,128,balanced,0.06313600142796834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,128,power_law_1.01,0.06269440054893494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,128,power_law_1.01,0.06327040195465088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,128,power_law_1.2,0.06428160071372986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,128,power_law_1.2,0.06561279892921448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,16,balanced,0.07462400197982788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,16,balanced,0.07496533294518788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,16,power_law_1.01,0.07619839906692505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,16,power_law_1.01,0.0766975998878479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,16,power_law_1.2,0.07713279724121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,16,power_law_1.2,0.07793920040130616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,2,balanced,0.15553067127863565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,2,balanced,0.15852266550064087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,2,power_law_1.01,0.16220799684524537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,2,power_law_1.01,0.16591999530792237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,2,power_law_1.2,0.1701632022857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,2,power_law_1.2,0.17018239498138427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,32,balanced,0.062394668658574425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,32,balanced,0.0639466643333435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,32,power_law_1.01,0.06592640280723572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,32,power_law_1.01,0.06734079718589783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,32,power_law_1.2,0.06549760103225707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,32,power_law_1.2,0.06656640172004699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,4,balanced,0.10925867160161336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,4,balanced,0.10935999949773152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,4,power_law_1.01,0.11609599590301514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,4,power_law_1.01,0.11788159608840942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,4,power_law_1.2,0.1189568042755127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,4,power_law_1.2,0.12023680210113526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,64,balanced,0.06256533165772755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,64,balanced,0.0637600024541219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,64,power_law_1.01,0.0641152024269104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,64,power_law_1.01,0.06437119841575623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,64,power_law_1.2,0.06506879925727845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,64,power_law_1.2,0.06525440216064453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,8,balanced,0.08621333042780559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,8,balanced,0.08646933237711589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,8,power_law_1.01,0.0876800000667572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,8,power_law_1.01,0.0881663978099823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,8,power_law_1.2,0.09047679901123047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,1,8,power_law_1.2,0.09079679846763611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,2,1,balanced,0.14405866463979086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,2,1,balanced,0.1460853318373362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,2,1,power_law_1.01,0.15665919780731202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,2,1,power_law_1.01,0.15767040252685546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,2,1,power_law_1.2,0.15856000185012817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,2,1,power_law_1.2,0.1591871976852417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,4,1,balanced,0.09922666351000468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,4,1,balanced,0.09924800197283427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,4,1,power_law_1.01,0.11177599430084229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,4,1,power_law_1.01,0.11247999668121338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,4,1,power_law_1.2,0.11293439865112305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2048,768,8,128,4,1,power_law_1.2,0.11365760564804077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,1,balanced,0.6728479862213135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,1,balanced,0.6748853524525961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,1,power_law_1.01,0.7405824184417724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,1,power_law_1.01,0.7506944179534912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,1,power_law_1.2,0.7585536003112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,1,power_law_1.2,0.7622144222259521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,128,balanced,0.08474666873613994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,128,balanced,0.08475200335184734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,128,power_law_1.01,0.08640639781951905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,128,power_law_1.01,0.08688639998435974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,128,power_law_1.2,0.08796160221099854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,128,power_law_1.2,0.08853759765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,16,balanced,0.10494400064150493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,16,balanced,0.10512533783912659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,16,power_law_1.01,0.11222399473190307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,16,power_law_1.01,0.1133504033088684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,16,power_law_1.2,0.1142016053199768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,16,power_law_1.2,0.11834880113601684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,2,balanced,0.3781813383102417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,2,balanced,0.38259732723236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,2,power_law_1.01,0.37061760425567625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,2,power_law_1.01,0.3747648000717163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,2,power_law_1.2,0.36890881061553954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,2,power_law_1.2,0.3812351942062378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,32,balanced,0.09285866220792134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,32,balanced,0.0930613378683726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,32,power_law_1.01,0.09630720019340515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,32,power_law_1.01,0.09704319834709167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,32,power_law_1.2,0.09848319888114929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,32,power_law_1.2,0.09963520169258118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,4,balanced,0.23046932617823282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,4,balanced,0.23108800252278647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,4,power_law_1.01,0.22230401039123535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,4,power_law_1.01,0.2249216079711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,4,power_law_1.2,0.22599680423736573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,4,power_law_1.2,0.22787840366363527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,64,balanced,0.08949866890907288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,64,balanced,0.09082667032877605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,64,power_law_1.01,0.09146239757537841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,64,power_law_1.01,0.09198079705238342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,64,power_law_1.2,0.09393919706344604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,64,power_law_1.2,0.09516159892082214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,8,balanced,0.15499200423558554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,8,balanced,0.1567520002524058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,8,power_law_1.01,0.1576192021369934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,8,power_law_1.01,0.16335359811782837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,8,power_law_1.2,0.16167039871215821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,1,8,power_law_1.2,0.16324479579925538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,16,1,balanced,0.23219732443491617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,16,1,balanced,0.2322559952735901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,16,1,power_law_1.01,0.24041600227355958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,16,1,power_law_1.01,0.24202239513397217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,16,1,power_law_1.2,0.2493824005126953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,16,1,power_law_1.2,0.2524800062179565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,2,1,balanced,0.3624480168024699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,2,1,balanced,0.3641066551208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,2,1,power_law_1.01,0.35253119468688965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,2,1,power_law_1.01,0.3537408113479614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,2,1,power_law_1.2,0.36513919830322267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,2,1,power_law_1.2,0.3737087965011597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,32,1,balanced,0.1992853283882141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,32,1,balanced,0.1997226675351461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,32,1,power_law_1.01,0.20650238990783693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,32,1,power_law_1.01,0.2106112003326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,32,1,power_law_1.2,0.21561601161956787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,32,1,power_law_1.2,0.21748480796813965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,4,1,balanced,0.2193386753400167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,4,1,balanced,0.21964265902837118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,4,1,power_law_1.01,0.21440000534057618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,4,1,power_law_1.01,0.21517438888549806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,4,1,power_law_1.2,0.21527040004730225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,4,1,power_law_1.2,0.2167680025100708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,8,1,balanced,0.3335306644439697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,8,1,balanced,0.3351466655731201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,8,1,power_law_1.01,0.3464576005935669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,8,1,power_law_1.01,0.34936320781707764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,8,1,power_law_1.2,0.36087679862976074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,2688,1856,6,128,8,1,power_law_1.2,0.3652224063873291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,1,balanced,1.1768319606781006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,1,balanced,1.2122399806976318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,1,power_law_1.01,1.065888023376465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,1,power_law_1.01,1.0759679794311523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,1,power_law_1.2,1.1154879570007323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,1,power_law_1.2,1.115839958190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,128,balanced,0.12733333309491476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,128,balanced,0.127402663230896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,128,power_law_1.01,0.12702080011367797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,128,power_law_1.01,0.12743680477142333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,128,power_law_1.2,0.12794239521026612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,128,power_law_1.2,0.12842240333557128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,16,balanced,0.18479466438293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,16,balanced,0.18515199422836304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,16,power_law_1.01,0.18670079708099366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,16,power_law_1.01,0.19045759439468385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,16,power_law_1.2,0.19349119663238526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,16,power_law_1.2,0.19456640481948853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,2,balanced,0.6511306762695312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,2,balanced,0.6564106543858846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,2,power_law_1.01,0.5985983848571778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,2,power_law_1.01,0.6118656158447265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,2,power_law_1.2,0.6217152118682862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,2,power_law_1.2,0.6444032192230225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,256,balanced,0.1202826698621114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,256,balanced,0.12152533729871114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,256,power_law_1.01,0.12243200540542602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,256,power_law_1.01,0.12252800464630127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,256,power_law_1.2,0.12340480089187622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,256,power_law_1.2,0.12369920015335083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,32,balanced,0.1381066640218099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,32,balanced,0.1384213368097941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,32,power_law_1.01,0.14206080436706542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,32,power_law_1.01,0.1420799970626831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,32,power_law_1.2,0.14282239675521852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,32,power_law_1.2,0.14583679437637329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,4,balanced,0.387717326482137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,4,balanced,0.3880106608072917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,4,power_law_1.01,0.36278400421142576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,4,power_law_1.01,0.3684799909591675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,4,power_law_1.2,0.36988799571990966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,4,power_law_1.2,0.38027520179748536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,64,balanced,0.12950399518013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,64,balanced,0.1295199990272522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,64,power_law_1.01,0.12911360263824462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,64,power_law_1.01,0.12916480302810668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,64,power_law_1.2,0.1306496024131775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,64,power_law_1.2,0.13263360261917115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,8,balanced,0.24868800242741904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,8,balanced,0.2494773268699646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,8,power_law_1.01,0.2438271999359131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,8,power_law_1.01,0.24775679111480714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,8,power_law_1.2,0.24858880043029785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,1,8,power_law_1.2,0.2544127941131592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,16,1,balanced,0.17828800280888876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,16,1,balanced,0.1789919932683309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,16,1,power_law_1.01,0.17340799570083618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,16,1,power_law_1.01,0.17350399494171143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,16,1,power_law_1.2,0.1739840030670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,16,1,power_law_1.2,0.17669119834899902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,2,1,balanced,0.6229226589202881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,2,1,balanced,0.6240373452504476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,2,1,power_law_1.01,0.5708096027374268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,2,1,power_law_1.01,0.5711616039276123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,2,1,power_law_1.2,0.5951295852661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,2,1,power_law_1.2,0.5987264156341553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,32,1,balanced,0.1357919971148173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,32,1,balanced,0.13672533631324768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,32,1,power_law_1.01,0.13211519718170167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,32,1,power_law_1.01,0.1330623984336853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,32,1,power_law_1.2,0.134169602394104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,32,1,power_law_1.2,0.13467520475387573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,4,1,balanced,0.3559946616490682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,4,1,balanced,0.3563733498255412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,4,1,power_law_1.01,0.33342719078063965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,4,1,power_law_1.01,0.3354496002197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,4,1,power_law_1.2,0.3377984046936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,4,1,power_law_1.2,0.34101119041442873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,8,1,balanced,0.22022932767868042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,8,1,balanced,0.22148799896240234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,8,1,power_law_1.01,0.2084928035736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,8,1,power_law_1.01,0.21109120845794677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,8,1,power_law_1.2,0.21335039138793946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,3072,1536,8,256,8,1,power_law_1.2,0.2165760040283203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,1,balanced,0.7636640071868896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,1,balanced,0.7648906707763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,1,power_law_1.01,0.9208959579467774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,1,power_law_1.01,0.9419967651367187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,1,power_law_1.2,0.9438464164733886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,1,power_law_1.2,0.9889216423034668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,2,balanced,0.4174986680348714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,2,balanced,0.4200906753540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,2,power_law_1.01,0.6085824012756348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,2,power_law_1.01,0.6094592094421387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,2,power_law_1.2,0.6400383949279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,2,power_law_1.2,0.7082560062408447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,4,balanced,0.30662933985392254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,4,balanced,0.31141332785288495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,4,power_law_1.01,0.374726390838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,4,power_law_1.01,0.39246718883514403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,4,power_law_1.2,0.4065536022186279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,4,power_law_1.2,0.4225344181060791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,8,balanced,0.2576799988746643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,8,balanced,0.25804799795150757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,8,power_law_1.01,0.3125312089920044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,8,power_law_1.01,0.3288640022277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,8,power_law_1.2,0.34610559940338137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,1,8,power_law_1.2,0.3502655982971191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,16,1,balanced,0.08734400073687236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,16,1,balanced,0.08872000376383464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,16,1,power_law_1.01,0.08751360177993775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,16,1,power_law_1.01,0.08780159950256347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,16,1,power_law_1.2,0.08755199909210205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,16,1,power_law_1.2,0.08773120045661927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,2,1,balanced,0.39800532658894855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,2,1,balanced,0.3989599943161011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,2,1,power_law_1.01,0.4594751834869385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,2,1,power_law_1.01,0.4622528076171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,2,1,power_law_1.2,0.4567872047424316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,2,1,power_law_1.2,0.46114559173583985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,32,1,balanced,0.07357866565386455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,32,1,balanced,0.07540800174077351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,32,1,power_law_1.01,0.07392640113830566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,32,1,power_law_1.01,0.0748416006565094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,32,1,power_law_1.2,0.07409279942512512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,32,1,power_law_1.2,0.07454720139503479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,4,1,balanced,0.2254400054613749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,4,1,balanced,0.22553600867589316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,4,1,power_law_1.01,0.23555200099945067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,4,1,power_law_1.01,0.2386944055557251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,4,1,power_law_1.2,0.23549439907073974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,4,1,power_law_1.2,0.2374783992767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,8,1,balanced,0.14468266566594443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,8,1,balanced,0.14492266376813254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,8,1,power_law_1.01,0.14160000085830687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,8,1,power_law_1.01,0.14364800453186036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,8,1,power_law_1.2,0.14419840574264525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,14336,2,8,8,1,power_law_1.2,0.1452288031578064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,1,balanced,0.812496026357015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,1,balanced,0.8182079792022705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,1,power_law_1.01,0.8452672004699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,1,power_law_1.01,0.8621248245239258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,1,power_law_1.2,0.8668224334716796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,1,power_law_1.2,0.8786432266235351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,128,balanced,0.11351999640464783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,128,balanced,0.11556266744931538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,128,power_law_1.01,0.1148800015449524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,128,power_law_1.01,0.1152448058128357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,128,power_law_1.2,0.11743999719619751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,128,power_law_1.2,0.11825920343399048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,16,balanced,0.13962666193644205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,16,balanced,0.14030933380126953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,16,power_law_1.01,0.1518399953842163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,16,power_law_1.01,0.15482879877090455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,16,power_law_1.2,0.15310720205307007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,16,power_law_1.2,0.15856000185012817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,2,balanced,0.46621867020924884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,2,balanced,0.467578649520874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,2,power_law_1.01,0.487775993347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,2,power_law_1.01,0.4885824203491211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,2,power_law_1.2,0.49953279495239256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,2,power_law_1.2,0.506496000289917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,32,balanced,0.124399999777476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,32,balanced,0.1253439982732137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,32,power_law_1.01,0.12814079523086547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,32,power_law_1.01,0.12817280292510985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,32,power_law_1.2,0.13029119968414307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,32,power_law_1.2,0.13246079683303832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,4,balanced,0.2800160050392151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,4,balanced,0.281333327293396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,4,power_law_1.01,0.29616000652313235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,4,power_law_1.01,0.3111680030822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,4,power_law_1.2,0.3053056001663208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,4,power_law_1.2,0.3101183891296387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,64,balanced,0.11945066849390666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,64,balanced,0.12269866466522217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,64,power_law_1.01,0.12275840044021606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,64,power_law_1.01,0.12277760505676269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,64,power_law_1.2,0.12433279752731323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,64,power_law_1.2,0.12460800409317016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,8,balanced,0.1925440033276876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,8,balanced,0.19354132811228433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,8,power_law_1.01,0.20686719417572022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,8,power_law_1.01,0.20993919372558595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,8,power_law_1.2,0.21422719955444336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,1,8,power_law_1.2,0.21580159664154053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,16,1,balanced,0.13878933588663736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,16,1,balanced,0.13889066378275552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,16,1,power_law_1.01,0.1422592043876648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,16,1,power_law_1.01,0.1435520052909851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,16,1,power_law_1.2,0.14391679763793946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,16,1,power_law_1.2,0.1464319944381714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,2,1,balanced,0.4510879913965861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,2,1,balanced,0.4538346529006958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,2,1,power_law_1.01,0.46684799194335935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,2,1,power_law_1.01,0.4677760124206543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,2,1,power_law_1.2,0.4715712070465088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,2,1,power_law_1.2,0.4784063816070557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,32,1,balanced,0.12342933813730876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,32,1,balanced,0.1237600048383077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,32,1,power_law_1.01,0.12668800354003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,32,1,power_law_1.01,0.12869759798049926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,32,1,power_law_1.2,0.1293503999710083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,32,1,power_law_1.2,0.1299008011817932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,4,1,balanced,0.2571093241373698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,4,1,balanced,0.2579039931297302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,4,1,power_law_1.01,0.2812544107437134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,4,1,power_law_1.01,0.28353281021118165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,4,1,power_law_1.2,0.28641281127929685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,4,1,power_law_1.2,0.2874176025390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,8,1,balanced,0.17145599921544394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,8,1,balanced,0.17298666636149088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,8,1,power_law_1.01,0.19818880558013915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,8,1,power_law_1.01,0.19871360063552856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,8,1,power_law_1.2,0.1974527955055237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,1536,8,128,8,1,power_law_1.2,0.1994752049446106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,1,balanced,5.629791895548503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,1,balanced,5.6362349192301435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,1,power_law_1.01,5.5474494934082035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,1,power_law_1.01,5.666828918457031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,1,power_law_1.2,5.605561447143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,1,power_law_1.2,5.61448974609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,128,balanced,0.4022773504257202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,128,balanced,0.40249598026275635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,128,power_law_1.01,0.41527681350708007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,128,power_law_1.01,0.41907200813293455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,128,power_law_1.2,0.427839994430542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,128,power_law_1.2,0.4303232192993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,16,balanced,0.7067413330078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,16,balanced,0.7076160113016764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,16,power_law_1.01,0.6894015789031982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,16,power_law_1.01,0.7002111911773682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,16,power_law_1.2,0.7113984107971192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,16,power_law_1.2,0.7224703788757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,2,balanced,3.0068639119466147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,2,balanced,3.0771681467692056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,2,power_law_1.01,2.869856071472168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,2,power_law_1.01,2.9156288146972655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,2,power_law_1.2,2.971104049682617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,2,power_law_1.2,3.03110408782959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,256,balanced,0.4018079837163289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,256,balanced,0.40298132101694745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,256,power_law_1.01,0.40769281387329104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,256,power_law_1.01,0.4088448047637939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,256,power_law_1.2,0.4137472152709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,256,power_law_1.2,0.415231990814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,32,balanced,0.5389973322550455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,32,balanced,0.5390133460362753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,32,power_law_1.01,0.5387328147888184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,32,power_law_1.01,0.54268798828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,32,power_law_1.2,0.5418623924255371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,32,power_law_1.2,0.5618879795074463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,4,balanced,1.634976069132487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,4,balanced,1.657541275024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,4,power_law_1.01,1.6363264083862306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,4,power_law_1.01,1.6481407165527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,4,power_law_1.2,1.6023359298706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,4,power_law_1.2,1.6997312545776366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,64,balanced,0.43572266896565753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,64,balanced,0.4370559851328532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,64,power_law_1.01,0.47177600860595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,64,power_law_1.01,0.4757887840270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,64,power_law_1.2,0.4786240100860596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,64,power_law_1.2,0.48108158111572263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,8,balanced,1.0136746565500896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,8,balanced,1.0144106547037761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,8,power_law_1.01,1.010758399963379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,8,power_law_1.01,1.015500831604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,8,power_law_1.2,1.0247424125671387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,1,8,power_law_1.2,1.032051181793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,16,1,balanced,1.5173600514729817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,16,1,balanced,1.5179039637247722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,16,1,power_law_1.01,1.564025592803955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,16,1,power_law_1.01,1.564889621734619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,16,1,power_law_1.2,1.6241600036621093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,16,1,power_law_1.2,1.6244224548339843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,2,1,balanced,2.7361599604288735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,2,1,balanced,2.73853333791097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,2,1,power_law_1.01,3.041440010070801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,2,1,power_law_1.01,3.0509952545166015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,2,1,power_law_1.2,3.083270454406738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,2,1,power_law_1.2,3.167942428588867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,32,1,balanced,1.2051093578338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,32,1,balanced,1.2073973019917805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,32,1,power_law_1.01,1.2543359756469727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,32,1,power_law_1.01,1.2571264266967774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,32,1,power_law_1.2,1.2906496047973632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,32,1,power_law_1.2,1.298361587524414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,4,1,balanced,1.888330618540446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,4,1,balanced,1.907807985941569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,4,1,power_law_1.01,1.842732810974121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,4,1,power_law_1.01,1.8494848251342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,4,1,power_law_1.2,1.9003519058227538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,4,1,power_law_1.2,1.9130687713623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,8,1,balanced,0.8363093535105387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,8,1,balanced,0.8429706891377767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,8,1,power_law_1.01,0.8365951538085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,8,1,power_law_1.01,0.84335355758667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,8,1,power_law_1.2,0.8654591560363769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,4096,2688,22,512,8,1,power_law_1.2,0.8681344032287598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,1,balanced,1.339637279510498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,1,balanced,1.35097074508667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,1,power_law_1.01,1.6045759201049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,1,power_law_1.01,1.64901123046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,1,power_law_1.2,1.5822976112365723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,1,power_law_1.2,1.6063808441162108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,2,balanced,0.7023146947224935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,2,balanced,0.7042133013407389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,2,power_law_1.01,0.9572799682617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,2,power_law_1.01,1.047379207611084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,2,power_law_1.2,1.0338432312011718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,2,power_law_1.2,1.0887231826782227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,4,balanced,0.41185065110524494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,4,balanced,0.41461865107218426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,4,power_law_1.01,0.5848703861236573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,4,power_law_1.01,0.5851136207580566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,4,power_law_1.2,0.5559423923492431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,4,power_law_1.2,0.5731264114379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,8,balanced,0.3272693355878194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,8,balanced,0.3304319977760315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,8,power_law_1.01,0.4448383808135986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,8,power_law_1.01,0.476255989074707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,8,power_law_1.2,0.4732351779937744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,1,8,power_law_1.2,0.47786240577697753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,16,1,balanced,0.11506666739781697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,16,1,balanced,0.11572800079981486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,16,1,power_law_1.01,0.1260032057762146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,16,1,power_law_1.01,0.12647039890289308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,16,1,power_law_1.2,0.12510080337524415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,16,1,power_law_1.2,0.12522879838943482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,2,1,balanced,0.6179306507110596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,2,1,balanced,0.6286453406016032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,2,1,power_law_1.01,0.7714111804962158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,2,1,power_law_1.01,0.7837823867797852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,2,1,power_law_1.2,0.758847999572754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,2,1,power_law_1.2,0.7671360015869141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,32,1,balanced,0.09890666604042053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,32,1,balanced,0.09914132952690125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,32,1,power_law_1.01,0.10263680219650269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,32,1,power_law_1.01,0.10433919429779052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,32,1,power_law_1.2,0.10308480262756348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,32,1,power_law_1.2,0.10347520112991333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,4,1,balanced,0.33372267087300617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,4,1,balanced,0.3383520046869914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,4,1,power_law_1.01,0.3748543977737427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,4,1,power_law_1.01,0.3863679885864258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,4,1,power_law_1.2,0.3759999990463257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,4,1,power_law_1.2,0.3926271915435791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,8,1,balanced,0.1981333295504252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,8,1,balanced,0.20124799013137817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,8,1,power_law_1.01,0.2125823974609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,8,1,power_law_1.01,0.21274240016937257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,8,1,power_law_1.2,0.20913279056549072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,16384,2,8,8,1,power_law_1.2,0.21320960521697999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,1,balanced,3.1804641087849936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,1,balanced,3.2286561330159507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,1,power_law_1.01,2.837459182739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,1,power_law_1.01,2.9419456481933595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,1,power_law_1.2,2.9540224075317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,1,power_law_1.2,2.9862720489501955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,128,balanced,0.20325332880020142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,128,balanced,0.20519467194875082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,128,power_law_1.01,0.2073280096054077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,128,power_law_1.01,0.2090751886367798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,128,power_law_1.2,0.2092223882675171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,128,power_law_1.2,0.21172480583190917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,16,balanced,0.3675626516342163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,16,balanced,0.3683520158131917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,16,power_law_1.01,0.35306880474090574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,16,power_law_1.01,0.36620159149169923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,16,power_law_1.2,0.3531584024429321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,16,power_law_1.2,0.3563008069992065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,2,balanced,1.6533013979593914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,2,balanced,1.6583840052286785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,2,power_law_1.01,1.4691391944885255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,2,power_law_1.01,1.4704768180847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,2,power_law_1.2,1.5150464057922364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,2,power_law_1.2,1.5466879844665526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,256,balanced,0.19761067628860474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,256,balanced,0.1989226738611857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,256,power_law_1.01,0.19868799448013305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,256,power_law_1.01,0.19877760410308837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,256,power_law_1.2,0.2022655963897705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,256,power_law_1.2,0.2028736114501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,32,balanced,0.2515893379847209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,32,balanced,0.25261332591374713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,32,power_law_1.01,0.2607295989990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,32,power_law_1.01,0.27073919773101807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,32,power_law_1.2,0.26175999641418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,32,power_law_1.2,0.26207358837127687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,4,balanced,0.8886026541392008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,4,balanced,0.889509359995524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,4,power_law_1.01,0.8425151824951171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,4,power_law_1.01,0.8700160026550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,4,power_law_1.2,0.8540160179138183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,4,power_law_1.2,0.8671808242797852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,64,balanced,0.2095093329747518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,64,balanced,0.21086400747299194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,64,power_law_1.01,0.2166912078857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,64,power_law_1.01,0.2198848009109497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,64,power_law_1.2,0.21875839233398436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,64,power_law_1.2,0.2266752004623413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,8,balanced,0.5395946502685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,8,balanced,0.5414826472600301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,8,power_law_1.01,0.5118080139160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,8,power_law_1.01,0.5145664215087891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,8,power_law_1.2,0.5292928218841553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,1,8,power_law_1.2,0.5304128170013428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,16,1,balanced,0.3492639859517415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,16,1,balanced,0.34991466999053955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,16,1,power_law_1.01,0.33793280124664304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,16,1,power_law_1.01,0.3385855913162231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,16,1,power_law_1.2,0.3390079975128174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,16,1,power_law_1.2,0.3396928071975708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,2,1,balanced,1.625871976216634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,2,1,balanced,1.6444427172342937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,2,1,power_law_1.01,1.4530495643615722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,2,1,power_law_1.01,1.467308807373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,2,1,power_law_1.2,1.4857215881347656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,2,1,power_law_1.2,1.514668846130371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,32,1,balanced,0.248416006565094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,32,1,balanced,0.24954134225845337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,32,1,power_law_1.01,0.24090240001678467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,32,1,power_law_1.01,0.24364800453186036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,32,1,power_law_1.2,0.24614400863647462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,32,1,power_law_1.2,0.24685440063476563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,4,1,balanced,0.8330826759338379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,4,1,balanced,0.8346986770629883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,4,1,power_law_1.01,0.7821375846862793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,4,1,power_law_1.01,0.7822400093078613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,4,1,power_law_1.2,0.7812992095947265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,4,1,power_law_1.2,0.7961664199829102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,8,1,balanced,0.5020480155944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,8,1,balanced,0.502128005027771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,8,1,power_law_1.01,0.4761536121368408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,8,1,power_law_1.01,0.48122239112854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,8,1,power_law_1.2,0.4819007873535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2048,8,256,8,1,power_law_1.2,0.48427519798278806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,1,balanced,2.5001866022745767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,1,balanced,2.512709299723307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,1,power_law_1.01,2.485887908935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,1,power_law_1.01,2.4878015518188477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,1,power_law_1.2,2.588684844970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,1,power_law_1.2,2.597747230529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,16,balanced,0.3038880030314128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,16,balanced,0.3041386604309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,16,power_law_1.01,0.3091327905654907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,16,power_law_1.01,0.31036159992218015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,16,power_law_1.2,0.31420800685882566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,16,power_law_1.2,0.3149888038635254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,2,balanced,1.2876266638437908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,2,balanced,1.326149304707845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,2,power_law_1.01,1.3017087936401368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,2,power_law_1.01,1.313049602508545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,2,power_law_1.2,1.3618559837341309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,2,power_law_1.2,1.3699071884155274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,32,balanced,0.20110932985941568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,32,balanced,0.20204265912373862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,32,power_law_1.01,0.23916161060333252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,32,power_law_1.01,0.243340802192688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,32,power_law_1.2,0.2520319938659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,32,power_law_1.2,0.25530879497528075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,4,balanced,0.711674690246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,4,balanced,0.7130773067474365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,4,power_law_1.01,0.7437439918518066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,4,power_law_1.01,0.7515456199645996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,4,power_law_1.2,0.7444928169250489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,4,power_law_1.2,0.7676352024078369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,8,balanced,0.4335413376490275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,8,balanced,0.4371573527654012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,8,power_law_1.01,0.454252815246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,8,power_law_1.01,0.46216959953308107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,8,power_law_1.2,0.46190080642700193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,1,8,power_law_1.2,0.46894078254699706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,16,1,balanced,0.290117343266805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,16,1,balanced,0.29051733016967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,16,1,power_law_1.01,0.2926271915435791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,16,1,power_law_1.01,0.293887996673584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,16,1,power_law_1.2,0.2944576025009155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,16,1,power_law_1.2,0.295961594581604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,2,1,balanced,1.2806986967722576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,2,1,balanced,1.3108586470286052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,2,1,power_law_1.01,1.2491071701049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,2,1,power_law_1.01,1.264793586730957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,2,1,power_law_1.2,1.2777536392211915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,2,1,power_law_1.2,1.2827327728271485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,32,1,balanced,0.20899200439453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,32,1,balanced,0.20935465892155966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,32,1,power_law_1.01,0.2144767999649048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,32,1,power_law_1.01,0.215231990814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,32,1,power_law_1.2,0.21583359241485595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,32,1,power_law_1.2,0.21650559902191163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,4,1,balanced,0.6742826302846273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,4,1,balanced,0.6785386403401693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,4,1,power_law_1.01,0.6715072154998779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,4,1,power_law_1.01,0.6973375797271728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,4,1,power_law_1.2,0.7041024208068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,4,1,power_law_1.2,0.7076096057891845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,8,1,balanced,0.38471468289693195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,8,1,balanced,0.3850080172220866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,8,1,power_law_1.01,0.4203648090362549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,8,1,power_law_1.01,0.4231103897094727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,8,1,power_law_1.2,0.4252352237701416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,6144,2560,8,160,8,1,power_law_1.2,0.4285888195037842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,1,balanced,3.6961441040039062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,1,balanced,3.697744051615397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,1,power_law_1.01,3.3332096099853517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,1,power_law_1.01,3.3624576568603515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,1,power_law_1.2,3.483865737915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,1,power_law_1.2,3.4852542877197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,128,balanced,0.22874667247136435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,128,balanced,0.23030932744344076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,128,power_law_1.01,0.23009281158447265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,128,power_law_1.01,0.23226239681243896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,128,power_law_1.2,0.2330496072769165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,128,power_law_1.2,0.23510398864746093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,16,balanced,0.42479467391967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,16,balanced,0.4275840123494466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,16,power_law_1.01,0.400486421585083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,16,power_law_1.01,0.41066880226135255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,16,power_law_1.2,0.40381441116333006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,16,power_law_1.2,0.40729598999023436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,2,balanced,1.9474612871805828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,2,balanced,1.949130694071452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,2,power_law_1.01,1.7199552536010743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,2,power_law_1.01,1.8178367614746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,2,power_law_1.2,1.7344831466674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,2,power_law_1.2,1.8133056640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,256,balanced,0.2218773365020752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,256,balanced,0.22368532419204712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,256,power_law_1.01,0.22053120136260987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,256,power_law_1.01,0.22154879570007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,256,power_law_1.2,0.22335360050201417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,256,power_law_1.2,0.22446720600128173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,32,balanced,0.29253333806991577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,32,balanced,0.29319467147191364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,32,power_law_1.01,0.2839168071746826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,32,power_law_1.01,0.2932159900665283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,32,power_law_1.2,0.29484798908233645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,32,power_law_1.2,0.30001280307769773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,4,balanced,1.03110933303833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,4,balanced,1.0315679709116619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,4,power_law_1.01,0.9705920219421387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,4,power_law_1.01,1.0044159889221191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,4,power_law_1.2,1.0088128089904784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,4,power_law_1.2,1.0128000259399415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,64,balanced,0.23635200659434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,64,balanced,0.2370133399963379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,64,power_law_1.01,0.24344320297241212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,64,power_law_1.01,0.24395520687103273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,64,power_law_1.2,0.2534143924713135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,64,power_law_1.2,0.2537343978881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,8,balanced,0.6254560152689616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,8,balanced,0.6262933413187662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,8,power_law_1.01,0.6000512123107911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,8,power_law_1.01,0.6115647792816162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,8,power_law_1.2,0.6016831874847413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,1,8,power_law_1.2,0.6144959926605225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,16,1,balanced,0.40531734625498456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,16,1,balanced,0.4059306780497233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,16,1,power_law_1.01,0.3882816076278687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,16,1,power_law_1.01,0.3923583984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,16,1,power_law_1.2,0.3896768093109131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,16,1,power_law_1.2,0.39571199417114256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,2,1,balanced,1.8809386889139812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,2,1,balanced,1.9323412577311199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,2,1,power_law_1.01,1.6656831741333007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,2,1,power_law_1.01,1.675929641723633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,2,1,power_law_1.2,1.7355392456054688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,2,1,power_law_1.2,1.7695743560791015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,32,1,balanced,0.28540800015131634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,32,1,balanced,0.2869386672973633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,32,1,power_law_1.01,0.2778048038482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,32,1,power_law_1.01,0.28066558837890626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,32,1,power_law_1.2,0.28373119831085203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,32,1,power_law_1.2,0.28596479892730714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,4,1,balanced,0.9732106526692709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,4,1,balanced,0.9830826918284098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,4,1,power_law_1.01,0.9115776062011719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,4,1,power_law_1.01,0.9129216194152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,4,1,power_law_1.2,0.9173695564270019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,4,1,power_law_1.2,0.9219903945922852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,8,1,balanced,0.5852959950764974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,8,1,balanced,0.5875893433888754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,8,1,power_law_1.01,0.5573503971099854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,8,1,power_law_1.01,0.5595776081085205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,8,1,power_law_1.2,0.5594624042510986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,256,8,1,power_law_1.2,0.5659200191497803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,1,balanced,5.500352223714192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,1,balanced,5.622293472290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,1,power_law_1.01,4.651411056518555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,1,power_law_1.01,4.684454345703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,1,power_law_1.2,4.650323104858399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,1,power_law_1.2,4.719065475463867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,128,balanced,0.28807999690373737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,128,balanced,0.28869332869847614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,128,power_law_1.01,0.28550400733947756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,128,power_law_1.01,0.2876032114028931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,128,power_law_1.2,0.2915519952774048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,128,power_law_1.2,0.295411205291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,16,balanced,0.5669866800308228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,16,balanced,0.56877334912618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,16,power_law_1.01,0.5253952026367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,16,power_law_1.01,0.537004804611206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,16,power_law_1.2,0.5154623985290527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,16,power_law_1.2,0.5529024124145507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,2,balanced,2.8598505655924478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,2,balanced,2.895301183064779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,2,power_law_1.01,2.4582719802856445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,2,power_law_1.01,2.517612838745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,2,power_law_1.2,2.3861888885498046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,2,power_law_1.2,2.4697088241577148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,32,balanced,0.40770665804545086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,32,balanced,0.40858133633931476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,32,power_law_1.01,0.3873408079147339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,32,power_law_1.01,0.3952320098876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,32,power_law_1.2,0.40860800743103026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,32,power_law_1.2,0.41199359893798826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,4,balanced,1.5061333974202473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,4,balanced,1.508805274963379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,4,power_law_1.01,1.3325759887695312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,4,power_law_1.01,1.3578495979309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,4,power_law_1.2,1.3314240455627442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,4,power_law_1.2,1.3554816246032715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,64,balanced,0.30617600679397583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,64,balanced,0.3092106580734253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,64,power_law_1.01,0.3022144079208374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,64,power_law_1.01,0.30483839511871336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,64,power_law_1.2,0.3174272060394287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,64,power_law_1.2,0.321996808052063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,8,balanced,0.8790132999420166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,8,balanced,0.8839466571807861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,8,power_law_1.01,0.7733312129974366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,8,power_law_1.01,0.806982421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,8,power_law_1.2,0.8211135864257812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,1,8,power_law_1.2,0.8217727661132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,16,1,balanced,0.5232693354288737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,16,1,balanced,0.5245279868443807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,16,1,power_law_1.01,0.47733120918273925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,16,1,power_law_1.01,0.47817602157592776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,16,1,power_law_1.2,0.478656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,16,1,power_law_1.2,0.4799359798431396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,2,1,balanced,2.7927093505859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,2,1,balanced,2.79313055674235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,2,1,power_law_1.01,2.337497520446777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,2,1,power_law_1.01,2.346099281311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,2,1,power_law_1.2,2.332032012939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,2,1,power_law_1.2,2.3465919494628906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,32,1,balanced,0.3833119869232178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,32,1,balanced,0.38436798254648846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,32,1,power_law_1.01,0.3501120090484619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,32,1,power_law_1.01,0.3510335922241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,32,1,power_law_1.2,0.3568063974380493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,32,1,power_law_1.2,0.35840640068054197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,4,1,balanced,1.4170559247334797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,4,1,balanced,1.4582773844401042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,4,1,power_law_1.01,1.1985152244567872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,4,1,power_law_1.01,1.2382464408874512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,4,1,power_law_1.2,1.2319040298461914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,4,1,power_law_1.2,1.2610495567321778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,8,1,balanced,0.8197387059529623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,8,1,balanced,0.8200533390045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,8,1,power_law_1.01,0.697215986251831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,8,1,power_law_1.01,0.7153600215911865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,8,1,power_law_1.2,0.7381631851196289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,512,7168,2048,8,384,8,1,power_law_1.2,0.7431424140930176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,1,balanced,0.7842506567637125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,1,balanced,0.7849226792653402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,1,power_law_1.01,0.8337151527404785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,1,power_law_1.01,0.8440383911132813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,1,power_law_1.2,0.850649642944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,1,power_law_1.2,0.8514304161071777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,128,balanced,0.3160799940427144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,128,balanced,0.31754666566848755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,128,power_law_1.01,0.34387199878692626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,128,power_law_1.01,0.34800000190734864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,128,power_law_1.2,0.3695487976074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,128,power_law_1.2,0.37182719707489015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,16,balanced,0.34669868151346844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,16,balanced,0.3479573329289754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,16,power_law_1.01,0.3872064113616943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,16,power_law_1.01,0.3905280113220215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,16,power_law_1.2,0.40113282203674316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,16,power_law_1.2,0.40919041633605957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,2,balanced,0.5836693445841471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,2,balanced,0.5859893163045248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,2,power_law_1.01,0.6417280197143554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,2,power_law_1.01,0.6504640102386474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,2,power_law_1.2,0.6642047882080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,2,power_law_1.2,0.6688511848449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,32,balanced,0.3287893335024516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,32,balanced,0.32915733257929486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,32,power_law_1.01,0.3669696092605591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,32,power_law_1.01,0.37280640602111814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,32,power_law_1.2,0.38646399974823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,32,power_law_1.2,0.3892672061920166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,4,balanced,0.45201067129770917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,4,balanced,0.45229331652323407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,4,power_law_1.01,0.5094399929046631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,4,power_law_1.01,0.5137919902801513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,4,power_law_1.2,0.5208831787109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,4,power_law_1.2,0.5388415813446045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,64,balanced,0.3208746711413066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,64,balanced,0.3209120035171509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,64,power_law_1.01,0.35075840950012205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,64,power_law_1.01,0.3564224004745483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,64,power_law_1.2,0.3722111940383911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,64,power_law_1.2,0.3798784017562866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,8,balanced,0.3821599880854289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,8,balanced,0.3821920156478882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,8,power_law_1.01,0.429036808013916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,8,power_law_1.01,0.4332287788391113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,8,power_law_1.2,0.4557375907897949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,1,8,power_law_1.2,0.4618239879608154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,2,1,balanced,0.5094346602757772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,2,1,balanced,0.5130133231480917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,2,1,power_law_1.01,0.5667136192321778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,2,1,power_law_1.01,0.567577600479126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,2,1,power_law_1.2,0.5704703807830811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,2,1,power_law_1.2,0.5732351779937744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,4,1,balanced,0.37592001756032306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,4,1,balanced,0.37625598907470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,4,1,power_law_1.01,0.4135615825653076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,4,1,power_law_1.01,0.4153088092803955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,4,1,power_law_1.2,0.41621761322021483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2048,768,8,128,4,1,power_law_1.2,0.416428804397583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,1,balanced,1.7793866793314617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,1,balanced,1.7969013849894206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,1,power_law_1.01,1.765875244140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,1,power_law_1.01,1.7725120544433595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,1,power_law_1.2,1.782054328918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,1,power_law_1.2,1.8126335144042969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,128,balanced,0.41713066895802814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,128,balanced,0.417466680208842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,128,power_law_1.01,0.4656191825866699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,128,power_law_1.01,0.4693120002746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,128,power_law_1.2,0.5322751998901367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,128,power_law_1.2,0.5390655994415283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,16,balanced,0.5021440188090006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,16,balanced,0.5030773480733236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,16,power_law_1.01,0.5659711837768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,16,power_law_1.01,0.5865536212921143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,16,power_law_1.2,0.6284607887268067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,16,power_law_1.2,0.6655424118041993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,2,balanced,1.1644852956136067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,2,balanced,1.1683306694030762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,2,power_law_1.01,1.2119808197021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,2,power_law_1.01,1.2150912284851074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,2,power_law_1.2,1.2281472206115722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,2,power_law_1.2,1.3160703659057618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,32,balanced,0.45334935188293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,32,balanced,0.454309344291687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,32,power_law_1.01,0.504582405090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,32,power_law_1.01,0.5220096111297607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,32,power_law_1.2,0.568064022064209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,32,power_law_1.2,0.5690239906311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,4,balanced,0.7986773649851481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,4,balanced,0.8005812962849935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,4,power_law_1.01,0.8336064338684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,4,power_law_1.01,0.8382847785949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,4,power_law_1.2,0.9151679992675781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,4,power_law_1.2,0.9434687614440918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,64,balanced,0.4272746642430623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,64,balanced,0.4285546541213989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,64,power_law_1.01,0.49112958908081056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,64,power_law_1.01,0.49149441719055176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,64,power_law_1.2,0.5423359870910645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,64,power_law_1.2,0.5529280185699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,8,balanced,0.6031413475672404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,8,balanced,0.6040960152943929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,8,power_law_1.01,0.6728064060211182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,8,power_law_1.01,0.680076789855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,8,power_law_1.2,0.7349440097808838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,1,8,power_law_1.2,0.7549439907073975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,16,1,balanced,0.8313546975453695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,16,1,balanced,0.8339040279388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,16,1,power_law_1.01,0.8205632209777832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,16,1,power_law_1.01,0.8295552253723144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,16,1,power_law_1.2,0.8393152236938477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,16,1,power_law_1.2,0.8403840065002441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,2,1,balanced,1.1061653296152751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,2,1,balanced,1.1087360382080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,2,1,power_law_1.01,1.0882944107055663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,2,1,power_law_1.01,1.1030591964721679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,2,1,power_law_1.2,1.1134592056274415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,2,1,power_law_1.2,1.119270420074463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,32,1,balanced,0.6804693539937338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,32,1,balanced,0.6815360387166342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,32,1,power_law_1.01,0.6801152229309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,32,1,power_law_1.01,0.6815296173095703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,32,1,power_law_1.2,0.6835264205932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,32,1,power_law_1.2,0.688640022277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,4,1,balanced,0.7139519850413004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,4,1,balanced,0.7147413094838461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,4,1,power_law_1.01,0.7037183761596679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,4,1,power_law_1.01,0.7063615798950196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,4,1,power_law_1.2,0.7180863857269287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,4,1,power_law_1.2,0.7252992153167724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,8,1,balanced,1.046720027923584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,8,1,balanced,1.04857603708903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,8,1,power_law_1.01,1.0391167640686034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,8,1,power_law_1.01,1.0415103912353516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,8,1,power_law_1.2,1.055622386932373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,2688,1856,6,128,8,1,power_law_1.2,1.0581439971923827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,1,balanced,2.7158613204956055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,1,balanced,2.8172267278035483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,1,power_law_1.01,2.7595775604248045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,1,power_law_1.01,2.780735969543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,1,power_law_1.2,2.7599424362182616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,1,power_law_1.2,2.844441604614258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,128,balanced,0.504858652750651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,128,balanced,0.5062666734059652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,128,power_law_1.01,0.5579904079437256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,128,power_law_1.01,0.561190414428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,128,power_law_1.2,0.5792191982269287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,128,power_law_1.2,0.5952064037322998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,16,balanced,0.6245973507563273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,16,balanced,0.6280320088068644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,16,power_law_1.01,0.7047872066497802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,16,power_law_1.01,0.7095871925354004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,16,power_law_1.2,0.7524159908294678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,16,power_law_1.2,0.7652607917785644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,2,balanced,1.556869347890218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,2,balanced,1.5662986437479656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,2,power_law_1.01,1.6893632888793946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,2,power_law_1.01,1.6980159759521485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,2,power_law_1.2,1.7363967895507812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,2,power_law_1.2,1.7533695220947265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,256,balanced,0.4984000126520793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,256,balanced,0.4997599919637044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,256,power_law_1.01,0.5368639945983886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,256,power_law_1.01,0.5381247997283936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,256,power_law_1.2,0.5795455932617187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,256,power_law_1.2,0.5805632114410401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,32,balanced,0.5572906732559204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,32,balanced,0.5582666794459025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,32,power_law_1.01,0.6264512062072753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,32,power_law_1.01,0.6301504135131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,32,power_law_1.2,0.6436800003051758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,32,power_law_1.2,0.6652736186981201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,4,balanced,1.0252319971720378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,4,balanced,1.028106689453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,4,power_law_1.01,1.1229311943054199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,4,power_law_1.01,1.141145610809326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,4,power_law_1.2,1.151033592224121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,4,power_law_1.2,1.1642560005187987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,64,balanced,0.5204960107803345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,64,balanced,0.5218240022659302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,64,power_law_1.01,0.5765247821807862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,64,power_law_1.01,0.5776832103729248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,64,power_law_1.2,0.613324785232544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,64,power_law_1.2,0.6352191925048828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,8,balanced,0.7619093259175619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,8,balanced,0.7640266418457031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,8,power_law_1.01,0.8462656021118165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,8,power_law_1.01,0.849516773223877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,8,power_law_1.2,0.867795181274414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,1,8,power_law_1.2,0.9486144065856934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,16,1,balanced,0.5430826743443807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,16,1,balanced,0.5431946516036987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,16,1,power_law_1.01,0.5658304214477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,16,1,power_law_1.01,0.5663616180419921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,16,1,power_law_1.2,0.5738495826721192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,16,1,power_law_1.2,0.5741184234619141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,2,1,balanced,1.460426648457845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,2,1,balanced,1.4761652946472168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,2,1,power_law_1.01,1.5339648246765136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,2,1,power_law_1.01,1.5576255798339844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,2,1,power_law_1.2,1.5777983665466309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,2,1,power_law_1.2,1.5838208198547363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,32,1,balanced,0.4519146680831909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,32,1,balanced,0.454037348429362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,32,1,power_law_1.01,0.475219202041626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,32,1,power_law_1.01,0.4752255916595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,32,1,power_law_1.2,0.4806464195251465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,32,1,power_law_1.2,0.48105602264404296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,4,1,balanced,0.9098933537801107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,4,1,balanced,0.9121812979380289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,4,1,power_law_1.01,0.9557439804077148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,4,1,power_law_1.01,0.9562496185302735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,4,1,power_law_1.2,0.9731200218200684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,4,1,power_law_1.2,0.9745152473449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,8,1,balanced,0.650597333908081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,8,1,balanced,0.6519146760304769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,8,1,power_law_1.01,0.6751552104949952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,8,1,power_law_1.01,0.6751935958862305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,8,1,power_law_1.2,0.6908607959747315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,3072,1536,8,256,8,1,power_law_1.2,0.6918335914611816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,1,balanced,5.112101236979167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,1,balanced,5.17849063873291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,1,power_law_1.01,5.126252746582031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,1,power_law_1.01,5.1660606384277346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,1,power_law_1.2,5.14392318725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,1,power_law_1.2,5.238278579711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,2,balanced,2.8086185455322266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,2,balanced,2.9150028228759766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,2,power_law_1.01,3.5159679412841798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,2,power_law_1.01,3.8596160888671873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,2,power_law_1.2,3.6992897033691405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,2,power_law_1.2,4.291334533691407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,4,balanced,1.6713600158691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,4,balanced,1.6872480710347493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,4,power_law_1.01,2.6813888549804688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,4,power_law_1.01,2.885798454284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,4,power_law_1.2,3.103673553466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,4,power_law_1.2,3.1749311447143556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,8,balanced,1.189674695332845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,8,balanced,1.1928586959838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,8,power_law_1.01,2.311609649658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,8,power_law_1.01,2.672422409057617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,8,power_law_1.2,2.5703359603881837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,1,8,power_law_1.2,2.606585693359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,16,1,balanced,0.4015626509984334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,16,1,balanced,0.4040693442026774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,16,1,power_law_1.01,0.41030402183532716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,16,1,power_law_1.01,0.4128960132598877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,16,1,power_law_1.2,0.40869760513305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,16,1,power_law_1.2,0.41437439918518065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,2,1,balanced,2.4578827222188315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,2,1,balanced,2.5356213251749673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,2,1,power_law_1.01,2.4606847763061523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,2,1,power_law_1.01,2.4637184143066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,2,1,power_law_1.2,2.453094482421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,2,1,power_law_1.2,2.461561584472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,32,1,balanced,0.28090665737787884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,32,1,balanced,0.28116800387700397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,32,1,power_law_1.01,0.28707840442657473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,32,1,power_law_1.01,0.2875391960144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,32,1,power_law_1.2,0.2839296102523804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,32,1,power_law_1.2,0.28631041049957273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,4,1,balanced,1.2381920019785564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,4,1,balanced,1.247040033340454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,4,1,power_law_1.01,1.2835712432861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,4,1,power_law_1.01,1.286393642425537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,4,1,power_law_1.2,1.2830400466918945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,4,1,power_law_1.2,1.287123203277588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,8,1,balanced,0.6887040138244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,8,1,balanced,0.691706657409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,8,1,power_law_1.01,0.6939455986022949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,8,1,power_law_1.01,0.703007984161377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,8,1,power_law_1.2,0.7027584075927734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,14336,2,8,8,1,power_law_1.2,0.7041279792785644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,1,balanced,2.60809596379598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,1,balanced,2.6218239466349282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,1,power_law_1.01,2.8380672454833986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,1,power_law_1.01,2.838092803955078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,1,power_law_1.2,2.8331199645996095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,1,power_law_1.2,2.8475648880004885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,128,balanced,0.5473653475443522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,128,balanced,0.5490399996439616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,128,power_law_1.01,0.6408895969390869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,128,power_law_1.01,0.6588863849639892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,128,power_law_1.2,0.7080128192901611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,128,power_law_1.2,0.7314367771148682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,16,balanced,0.660154660542806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,16,balanced,0.6618133385976156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,16,power_law_1.01,0.8089216232299805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,16,power_law_1.01,0.8417728424072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,16,power_law_1.2,0.8806591987609863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,16,power_law_1.2,0.8918144226074218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,2,balanced,1.5524266560872395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,2,balanced,1.5763840675354004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,2,power_law_1.01,1.792083168029785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,2,power_law_1.01,1.8513919830322265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,2,power_law_1.2,1.8796863555908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,2,power_law_1.2,1.9018112182617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,32,balanced,0.593450665473938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,32,balanced,0.595418651898702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,32,power_law_1.01,0.7429247856140136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,32,power_law_1.01,0.7456384181976319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,32,power_law_1.2,0.7833471775054932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,32,power_law_1.2,0.7842559814453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,4,balanced,1.0486453374226887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,4,balanced,1.0510079860687256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,4,power_law_1.01,1.2404735565185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,4,power_law_1.01,1.272531223297119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,4,power_law_1.2,1.2995008468627929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,4,power_law_1.2,1.3965567588806151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,64,balanced,0.562112013498942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,64,balanced,0.564736008644104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,64,power_law_1.01,0.6708288192749023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,64,power_law_1.01,0.6923200130462647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,64,power_law_1.2,0.7477824211120605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,64,power_law_1.2,0.7498303890228272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,8,balanced,0.7876693407694498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,8,balanced,0.7910613218943278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,8,power_law_1.01,0.9753087997436524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,8,power_law_1.01,0.9808704376220703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,8,power_law_1.2,1.0940735816955567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,1,8,power_law_1.2,1.1304639816284179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,16,1,balanced,0.5760533412297567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,16,1,balanced,0.576912005742391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,16,1,power_law_1.01,0.6460671901702881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,16,1,power_law_1.01,0.6476928234100342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,16,1,power_law_1.2,0.6488704204559326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,16,1,power_law_1.2,0.6507904052734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,2,1,balanced,1.395242691040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,2,1,balanced,1.4089600245157878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,2,1,power_law_1.01,1.4889151573181152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,2,1,power_law_1.01,1.5187135696411134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,2,1,power_law_1.2,1.5088000297546387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,2,1,power_law_1.2,1.525228786468506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,32,1,balanced,0.5058346589406332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,32,1,balanced,0.5086933374404907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,32,1,power_law_1.01,0.5450687885284424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,32,1,power_law_1.01,0.5455423831939697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,32,1,power_law_1.2,0.5475264072418213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,32,1,power_law_1.2,0.5478911876678467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,4,1,balanced,0.9228106339772543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,4,1,balanced,0.9265493551890055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,4,1,power_law_1.01,1.024403190612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,4,1,power_law_1.01,1.0293184280395509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,4,1,power_law_1.2,1.0376959800720216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,4,1,power_law_1.2,1.0377535820007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,8,1,balanced,0.6665759881337484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,8,1,balanced,0.6669759750366211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,8,1,power_law_1.01,0.7388735771179199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,8,1,power_law_1.01,0.7391808032989502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,8,1,power_law_1.2,0.7411456108093262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,1536,8,128,8,1,power_law_1.2,0.7459199905395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,1,balanced,17.41852315266927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,1,balanced,18.045333862304688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,1,power_law_1.01,16.3732421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,1,power_law_1.01,16.437965393066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,1,power_law_1.2,16.708384704589843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,1,power_law_1.2,16.784474182128907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,128,balanced,1.9951252937316895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,128,balanced,1.9956426620483398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,128,power_law_1.01,2.182912063598633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,128,power_law_1.01,2.1895360946655273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,128,power_law_1.2,2.310073661804199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,128,power_law_1.2,2.3374271392822266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,16,balanced,2.749535878499349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,16,balanced,2.7570346196492515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,16,power_law_1.01,3.034636878967285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,16,power_law_1.01,3.0522176742553713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,16,power_law_1.2,3.06176643371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,16,power_law_1.2,3.1790464401245115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,2,balanced,9.68933359781901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,2,balanced,9.784255981445312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,2,power_law_1.01,9.325804901123046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,2,power_law_1.01,9.33587188720703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,2,power_law_1.2,9.673312377929687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,2,power_law_1.2,9.694579315185546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,256,balanced,1.9402507146199544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,256,balanced,1.9430079460144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,256,power_law_1.01,2.1029247283935546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,256,power_law_1.01,2.126688003540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,256,power_law_1.2,2.227859115600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,256,power_law_1.2,2.2571840286254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,32,balanced,2.3189013799031577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,32,balanced,2.322101275126139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,32,power_law_1.01,2.5526144027709963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,32,power_law_1.01,2.608492851257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,32,power_law_1.2,2.692736053466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,32,power_law_1.2,2.795737648010254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,4,balanced,5.54531733194987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,4,balanced,5.565039952596028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,4,power_law_1.01,5.719750213623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,4,power_law_1.01,5.7242431640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,4,power_law_1.2,5.831238555908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,4,power_law_1.2,5.9643199920654295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,64,balanced,2.1053172747294107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,64,balanced,2.1061973571777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,64,power_law_1.01,2.328691291809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,64,power_law_1.01,2.338252830505371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,64,power_law_1.2,2.413702392578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,64,power_law_1.2,2.419411277770996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,8,balanced,3.630885442097982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,8,balanced,3.635295867919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,8,power_law_1.01,3.6925823211669924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,8,power_law_1.01,3.8319232940673826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,8,power_law_1.2,3.9631744384765626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,1,8,power_law_1.2,4.131065750122071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,16,1,balanced,4.965445200602214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,16,1,balanced,4.966848055521647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,16,1,power_law_1.01,4.655744171142578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,16,1,power_law_1.01,4.659667205810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,16,1,power_law_1.2,4.729817581176758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,16,1,power_law_1.2,4.737120056152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,2,1,balanced,7.820506413777669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,2,1,balanced,8.002442677815756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,2,1,power_law_1.01,7.6781059265136715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,2,1,power_law_1.01,7.862188720703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,2,1,power_law_1.2,7.995219421386719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,2,1,power_law_1.2,8.293766021728516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,32,1,balanced,4.356245358784993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,32,1,balanced,4.361413319905599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,32,1,power_law_1.01,4.077951812744141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,32,1,power_law_1.01,4.079411315917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,32,1,power_law_1.2,4.1559295654296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,32,1,power_law_1.2,4.171654510498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,4,1,balanced,12.789114634195963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,4,1,balanced,13.377647399902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,4,1,power_law_1.01,13.028665161132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,4,1,power_law_1.01,13.111334228515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,4,1,power_law_1.2,13.044493103027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,4,1,power_law_1.2,13.276039123535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,8,1,balanced,3.1889918645222983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,8,1,balanced,3.2474826176961265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,8,1,power_law_1.01,2.9825536727905275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,8,1,power_law_1.01,2.9947776794433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,8,1,power_law_1.2,3.0233407974243165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,4096,2688,22,512,8,1,power_law_1.2,3.0336639404296877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,1,balanced,8.539183934529623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,1,balanced,9.355199813842773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,1,power_law_1.01,8.888460540771485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,1,power_law_1.01,8.986637115478516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,1,power_law_1.2,8.739315032958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,1,power_law_1.2,9.120832061767578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,2,balanced,4.443168004353841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,2,balanced,4.604874610900879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,2,power_law_1.01,6.006143951416016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,2,power_law_1.01,6.074816131591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,2,power_law_1.2,6.639366149902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,2,power_law_1.2,6.769497680664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,4,balanced,2.504202683766683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,4,balanced,2.616208076477051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,4,power_law_1.01,4.61847038269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,4,power_law_1.01,5.165875244140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,4,power_law_1.2,4.877856063842773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,4,power_law_1.2,5.2481536865234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,8,balanced,1.574885368347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,8,balanced,1.5988160769144695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,8,power_law_1.01,4.084640121459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,8,power_law_1.01,4.248249435424805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,8,power_law_1.2,4.016780853271484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,1,8,power_law_1.2,4.1145984649658205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,16,1,balanced,0.6481279929478964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,16,1,balanced,0.6494293212890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,16,1,power_law_1.01,0.6645055770874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,16,1,power_law_1.01,0.6653567790985108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,16,1,power_law_1.2,0.6572927951812744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,16,1,power_law_1.2,0.6658559799194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,2,1,balanced,4.176735877990723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,2,1,balanced,4.3171946207682295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,2,1,power_law_1.01,4.102399826049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,2,1,power_law_1.01,4.116486358642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,2,1,power_law_1.2,4.028755187988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,2,1,power_law_1.2,4.200172805786133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,32,1,balanced,0.4118826786677043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,32,1,balanced,0.41516268253326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,32,1,power_law_1.01,0.4213119983673096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,32,1,power_law_1.01,0.4227456092834473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,32,1,power_law_1.2,0.4235392093658447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,32,1,power_law_1.2,0.4260735988616943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,4,1,balanced,2.0884693463643393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,4,1,balanced,2.0949974060058594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,4,1,power_law_1.01,2.069958305358887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,4,1,power_law_1.01,2.08856315612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,4,1,power_law_1.2,2.09039363861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,4,1,power_law_1.2,2.1158720016479493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,8,1,balanced,1.098410685857137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,8,1,balanced,1.1244213581085205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,8,1,power_law_1.01,1.1308480262756349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,8,1,power_law_1.01,1.14202880859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,8,1,power_law_1.2,1.1321727752685546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,16384,2,8,8,1,power_law_1.2,1.1382335662841796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,1,balanced,6.645989100138347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,1,balanced,7.583311716715495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,1,power_law_1.01,7.365586853027343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,1,power_law_1.01,7.503526306152343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,1,power_law_1.2,7.132537841796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,1,power_law_1.2,7.418540954589844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,128,balanced,0.8278773625691732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,128,balanced,0.8302880128224691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,128,power_law_1.01,0.9568960189819335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,128,power_law_1.01,0.989459228515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,128,power_law_1.2,1.053286361694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,128,power_law_1.2,1.0758015632629394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,16,balanced,1.129578669865926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,16,balanced,1.1335466702779133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,16,power_law_1.01,1.2918784141540527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,16,power_law_1.01,1.335968017578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,16,power_law_1.2,1.381004810333252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,16,power_law_1.2,1.466374397277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,2,balanced,3.8374560674031577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,2,balanced,4.024282773335774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,2,power_law_1.01,4.08581771850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,2,power_law_1.01,4.2031806945800785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,2,power_law_1.2,4.212985610961914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,2,power_law_1.2,4.3009601593017575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,256,balanced,0.8123573462168375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,256,balanced,0.8156479994455973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,256,power_law_1.01,0.9102527618408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,256,power_law_1.01,0.910540771484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,256,power_law_1.2,1.0027135848999023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,256,power_law_1.2,1.025875186920166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,32,balanced,0.9596160252888998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,32,balanced,0.9598720073699951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,32,power_law_1.01,1.1232640266418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,32,power_law_1.01,1.1605759620666505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,32,power_law_1.2,1.218284797668457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,32,power_law_1.2,1.2538368225097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,4,balanced,2.1706239382425943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,4,balanced,2.204213301340739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,4,power_law_1.01,2.4726015090942384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,4,power_law_1.01,2.492223930358887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,4,power_law_1.2,2.5440319061279295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,4,power_law_1.2,2.670547294616699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,64,balanced,0.8756906986236572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,64,balanced,0.8766613006591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,64,power_law_1.01,0.9981247901916503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,64,power_law_1.01,1.0363391876220702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,64,power_law_1.2,1.1195903778076173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,64,power_law_1.2,1.1407808303833007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,8,balanced,1.4830293655395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,8,balanced,1.4845760663350422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,8,power_law_1.01,1.7057344436645507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,8,power_law_1.01,1.7155071258544923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,8,power_law_1.2,1.8574527740478515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,1,8,power_law_1.2,1.888991928100586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,16,1,balanced,1.0032906532287598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,16,1,balanced,1.0050133069356282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,16,1,power_law_1.01,1.0423999786376954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,16,1,power_law_1.01,1.0429823875427247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,16,1,power_law_1.2,1.0566399574279786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,16,1,power_law_1.2,1.062553596496582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,2,1,balanced,3.5054454803466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,2,1,balanced,3.51311461130778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,2,1,power_law_1.01,3.640620803833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,2,1,power_law_1.01,3.72619514465332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,2,1,power_law_1.2,3.912947082519531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,2,1,power_law_1.2,3.930815887451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,32,1,balanced,0.8292480309804281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,32,1,balanced,0.829535961151123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,32,1,power_law_1.01,0.8593536376953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,32,1,power_law_1.01,0.8629504203796386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,32,1,power_law_1.2,0.8713727951049804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,32,1,power_law_1.2,0.873100757598877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,4,1,balanced,2.013578732808431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,4,1,balanced,2.056191921234131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,4,1,power_law_1.01,2.1297088623046876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,4,1,power_law_1.01,2.146886444091797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,4,1,power_law_1.2,2.1792640686035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,4,1,power_law_1.2,2.179750442504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,8,1,balanced,1.3277493317921956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,8,1,balanced,1.3317386309305828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,8,1,power_law_1.01,1.403974437713623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,8,1,power_law_1.01,1.4079872131347657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,8,1,power_law_1.2,1.431820774078369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2048,8,256,8,1,power_law_1.2,1.4369600296020508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,1,balanced,7.7012481689453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,1,balanced,7.830394744873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,1,power_law_1.01,7.721171569824219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,1,power_law_1.01,7.858700561523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,1,power_law_1.2,7.7944892883300785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,1,power_law_1.2,7.950323486328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,16,balanced,1.194538672765096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,16,balanced,1.1984533468882244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,16,power_law_1.01,1.475046443939209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,16,power_law_1.01,1.5047360420227052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,16,power_law_1.2,1.6551935195922851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,16,power_law_1.2,1.6865215301513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,2,balanced,4.082826614379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,2,balanced,4.432287851969401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,2,power_law_1.01,4.607353591918946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,2,power_law_1.01,4.688358306884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,2,power_law_1.2,4.393017578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,2,power_law_1.2,4.550508880615235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,32,balanced,1.0039947032928467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,32,balanced,1.0053866704305012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,32,power_law_1.01,1.2831232070922851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,32,power_law_1.01,1.3310976028442383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,32,power_law_1.2,1.3587136268615723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,32,power_law_1.2,1.520723247528076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,4,balanced,2.3779145876566568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,4,balanced,2.444416046142578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,4,power_law_1.01,2.771776008605957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,4,power_law_1.01,2.836966323852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,4,power_law_1.2,2.690912055969238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,4,power_law_1.2,2.80501766204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,8,balanced,1.5812106132507324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,8,balanced,1.5813600222269695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,8,power_law_1.01,1.8984832763671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,8,power_law_1.01,2.021945571899414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,8,power_law_1.2,2.0083776473999024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,1,8,power_law_1.2,2.1695552825927735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,16,1,balanced,1.0520213445027669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,16,1,balanced,1.0528693199157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,16,1,power_law_1.01,1.0821184158325194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,16,1,power_law_1.01,1.0856063842773438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,16,1,power_law_1.2,1.1067135810852051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,16,1,power_law_1.2,1.1092288017272949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,2,1,balanced,3.965200106302897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,2,1,balanced,4.3086293538411455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,2,1,power_law_1.01,3.815456008911133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,2,1,power_law_1.01,3.969612884521484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,2,1,power_law_1.2,3.840582275390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,2,1,power_law_1.2,3.8885440826416016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,32,1,balanced,0.9249653021494547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,32,1,balanced,0.9252106348673502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,32,1,power_law_1.01,0.9335103988647461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,32,1,power_law_1.01,0.9380800247192382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,32,1,power_law_1.2,0.9454079627990722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,32,1,power_law_1.2,0.9475071907043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,4,1,balanced,2.1727892557779946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,4,1,balanced,2.2795467376708984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,4,1,power_law_1.01,2.1740352630615236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,4,1,power_law_1.01,2.1745279312133787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,4,1,power_law_1.2,2.222777557373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,4,1,power_law_1.2,2.226291275024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,8,1,balanced,1.4026719729105632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,8,1,balanced,1.4058027267456055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,8,1,power_law_1.01,1.4077887535095215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,8,1,power_law_1.01,1.4100031852722168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,8,1,power_law_1.2,1.4161791801452637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,6144,2560,8,160,8,1,power_law_1.2,1.4193984031677247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,1,balanced,8.139823913574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,1,balanced,8.527706782023111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,1,power_law_1.01,8.366706848144531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,1,power_law_1.01,8.838086700439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,1,power_law_1.2,8.716031646728515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,1,power_law_1.2,8.750624084472657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,128,balanced,0.9157226880391439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,128,balanced,0.9162293275197347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,128,power_law_1.01,1.0556096076965331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,128,power_law_1.01,1.0878144264221192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,128,power_law_1.2,1.1921600341796874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,128,power_law_1.2,1.2543040275573731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,16,balanced,1.264405330022176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,16,balanced,1.2676693598429363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,16,power_law_1.01,1.4896127700805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,16,power_law_1.01,1.5415743827819823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,16,power_law_1.2,1.612006378173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,16,power_law_1.2,1.6778112411499024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,2,balanced,4.3744001388549805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,2,balanced,4.493898709615071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,2,power_law_1.01,4.700735855102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,2,power_law_1.01,4.849760055541992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,2,power_law_1.2,4.926649475097657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,2,power_law_1.2,5.222451019287109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,256,balanced,0.8940587043762207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,256,balanced,0.8988107045491537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,256,power_law_1.01,1.0058560371398926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,256,power_law_1.01,1.0095744132995605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,256,power_law_1.2,1.1407103538513184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,256,power_law_1.2,1.1527104377746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,32,balanced,1.0679946740468342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,32,balanced,1.0686773459116619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,32,power_law_1.01,1.268883228302002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,32,power_law_1.01,1.2810879707336427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,32,power_law_1.2,1.3432767868041993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,32,power_law_1.2,1.3828224182128905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,4,balanced,2.5092533429463706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,4,balanced,2.5406667391459146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,4,power_law_1.01,2.828755187988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,4,power_law_1.01,2.9284799575805662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,4,power_law_1.2,3.150649642944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,4,power_law_1.2,3.2232574462890624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,64,balanced,0.9669439792633057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,64,balanced,0.9693013032277426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,64,power_law_1.01,1.1285887718200684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,64,power_law_1.01,1.1393792152404785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,64,power_law_1.2,1.2226176261901855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,64,power_law_1.2,1.2559743881225587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,8,balanced,1.670629342397054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,8,balanced,1.6823573112487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,8,power_law_1.01,1.901055908203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,8,power_law_1.01,1.9273408889770507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,8,power_law_1.2,2.1631359100341796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,1,8,power_law_1.2,2.211180877685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,16,1,balanced,1.1571733156840007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,16,1,balanced,1.158725341161092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,16,1,power_law_1.01,1.1974592208862305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,16,1,power_law_1.01,1.2002943992614745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,16,1,power_law_1.2,1.2193023681640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,16,1,power_law_1.2,1.228831958770752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,2,1,balanced,4.236005465189616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,2,1,balanced,4.45249080657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,2,1,power_law_1.01,4.4958656311035154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,2,1,power_law_1.01,4.681964874267578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,2,1,power_law_1.2,4.535193634033203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,2,1,power_law_1.2,4.539430236816406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,32,1,balanced,0.9541760285695394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,32,1,balanced,0.954965353012085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,32,1,power_law_1.01,0.9903615951538086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,32,1,power_law_1.01,0.9912063598632812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,32,1,power_law_1.2,1.0022784233093263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,32,1,power_law_1.2,1.013209629058838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,4,1,balanced,2.4627307256062827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,4,1,balanced,2.4851786295572915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,4,1,power_law_1.01,2.46313591003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,4,1,power_law_1.01,2.5267839431762695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,4,1,power_law_1.2,2.5227519989013674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,4,1,power_law_1.2,2.5311424255371096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,8,1,balanced,1.5391146341959636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,8,1,balanced,1.5408053398132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,8,1,power_law_1.01,1.6267328262329102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,8,1,power_law_1.01,1.632748794555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,8,1,power_law_1.2,1.6507776260375977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,256,8,1,power_law_1.2,1.6534784317016602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,1,balanced,7.6947892506917315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,1,balanced,8.0403200785319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,1,power_law_1.01,10.044857788085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,1,power_law_1.01,10.179264068603516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,1,power_law_1.2,10.49719009399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,1,power_law_1.2,10.558195495605469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,128,balanced,0.9653493563334147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,128,balanced,0.9656533400217692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,128,power_law_1.01,1.1089280128479004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,128,power_law_1.01,1.118336009979248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,128,power_law_1.2,1.1797568321228027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,128,power_law_1.2,1.204851245880127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,16,balanced,1.308181365331014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,16,balanced,1.3104106585184734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,16,power_law_1.01,1.6114240646362306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,16,power_law_1.01,1.6320575714111327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,16,power_law_1.2,1.6692096710205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,16,power_law_1.2,1.7248384475708007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,2,balanced,4.449221293131511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,2,balanced,4.450133323669434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,2,power_law_1.01,5.370912170410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,2,power_law_1.01,5.605612945556641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,2,power_law_1.2,6.013536071777343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,2,power_law_1.2,6.029830551147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,32,balanced,1.1137173175811768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,32,balanced,1.1171573003133137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,32,power_law_1.01,1.3516608238220216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,32,power_law_1.01,1.3530431747436524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,32,power_law_1.2,1.4437376022338868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,32,power_law_1.2,1.4449536323547363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,4,balanced,2.4867199261983237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,4,balanced,2.496250629425049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,4,power_law_1.01,3.1838016510009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,4,power_law_1.01,3.2074817657470702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,4,power_law_1.2,3.3206912994384767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,4,power_law_1.2,3.4002174377441405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,64,balanced,1.0105546315511067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,64,balanced,1.0122026602427165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,64,power_law_1.01,1.1760640144348145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,64,power_law_1.01,1.1772800445556642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,64,power_law_1.2,1.2526847839355468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,64,power_law_1.2,1.306668758392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,8,balanced,1.7078773180643718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,8,balanced,1.7150932947794597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,8,power_law_1.01,2.1329343795776365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,8,power_law_1.01,2.180486488342285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,8,power_law_1.2,2.3007551193237306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,1,8,power_law_1.2,2.342508888244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,16,1,balanced,1.1309226353963215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,16,1,balanced,1.1341066360473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,16,1,power_law_1.01,1.3560128211975098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,16,1,power_law_1.01,1.3666367530822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,16,1,power_law_1.2,1.3886528015136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,16,1,power_law_1.2,1.38919677734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,2,1,balanced,4.134629249572754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,2,1,balanced,4.263797442118327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,2,1,power_law_1.01,5.23570556640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,2,1,power_law_1.01,5.241721725463867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,2,1,power_law_1.2,5.474771118164062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,2,1,power_law_1.2,5.5050304412841795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,32,1,balanced,0.9651626745859782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,32,1,balanced,0.9652319749196371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,32,1,power_law_1.01,1.1248512268066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,32,1,power_law_1.01,1.1317440032958985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,32,1,power_law_1.2,1.1551168441772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,32,1,power_law_1.2,1.1569855690002442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,4,1,balanced,2.321173350016276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,4,1,balanced,2.3561280568440757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,4,1,power_law_1.01,2.86297607421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,4,1,power_law_1.01,2.871481513977051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,4,1,power_law_1.2,3.0180864334106445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,4,1,power_law_1.2,3.067027282714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,8,1,balanced,1.52511994043986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,8,1,balanced,1.5291147232055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,8,1,power_law_1.01,1.84703369140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,8,1,power_law_1.01,1.8503999710083008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,8,1,power_law_1.2,1.9251007080078124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,6144,7168,2048,8,384,8,1,power_law_1.2,1.9321727752685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,1,balanced,0.20730666319529215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,1,balanced,0.20841066042582193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,1,power_law_1.01,0.18952319622039795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,1,power_law_1.01,0.19271039962768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,1,power_law_1.2,0.19367680549621583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,1,power_law_1.2,0.19415040016174318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,128,balanced,0.0335359995563825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,128,balanced,0.03362133353948593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,128,power_law_1.01,0.03269760012626648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,128,power_law_1.01,0.03284479975700379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,128,power_law_1.2,0.03264000117778778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,128,power_law_1.2,0.032671999931335446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,16,balanced,0.04257600009441376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,16,balanced,0.04322666426499685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,16,power_law_1.01,0.040780800580978396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,16,power_law_1.01,0.04121600091457367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,16,power_law_1.2,0.040780800580978396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,16,power_law_1.2,0.04092159867286682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,2,balanced,0.13637866576512656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,2,balanced,0.14891200264294943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,2,power_law_1.01,0.12369920015335083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,2,power_law_1.01,0.12743040323257446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,2,power_law_1.2,0.13030400276184081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,2,power_law_1.2,0.1313472032546997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,32,balanced,0.037274666130542755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,32,balanced,0.03748266647259394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,32,power_law_1.01,0.0348800003528595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,32,power_law_1.01,0.03493120074272156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,32,power_law_1.2,0.035174399614334106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,32,power_law_1.2,0.035417601466178894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,4,balanced,0.08895466725031535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,4,balanced,0.09156266848246257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,4,power_law_1.01,0.08150399923324585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,4,power_law_1.01,0.08239359855651855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,4,power_law_1.2,0.0851967990398407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,4,power_law_1.2,0.08723840117454529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,64,balanced,0.03533866753180822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,64,balanced,0.03579733272393545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,64,power_law_1.01,0.033190399408340454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,64,power_law_1.01,0.03322240114212036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,64,power_law_1.2,0.03314560055732727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,64,power_law_1.2,0.033471998572349546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,8,balanced,0.05758399764696757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,8,balanced,0.05903466542561849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,8,power_law_1.01,0.05324159860610962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,8,power_law_1.01,0.05633919835090637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,8,power_law_1.2,0.055129599571228025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,1,8,power_law_1.2,0.055212801694869994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,2,1,balanced,0.13964266578356424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,2,1,balanced,0.14071466525395712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,2,1,power_law_1.01,0.12698240280151368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,2,1,power_law_1.01,0.13013119697570802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,2,1,power_law_1.2,0.13218560218811035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,2,1,power_law_1.2,0.13303040266036986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,4,1,balanced,0.09991466999053955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,4,1,balanced,0.10121599833170573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,4,1,power_law_1.01,0.09499520063400269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,4,1,power_law_1.01,0.09608319997787476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,4,1,power_law_1.2,0.09393919706344604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2048,768,8,128,4,1,power_law_1.2,0.09477120041847228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,1,balanced,0.5816426674524943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,1,balanced,0.5834399859110514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,1,power_law_1.01,0.48430719375610354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,1,power_law_1.01,0.49912319183349607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,1,power_law_1.2,0.49109759330749514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,1,power_law_1.2,0.4971776008605957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,128,balanced,0.040661332507928215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,128,balanced,0.04139200101296107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,128,power_law_1.01,0.03991680145263672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,128,power_law_1.01,0.040294399857521056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,128,power_law_1.2,0.04023039937019348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,128,power_law_1.2,0.04028800129890442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,16,balanced,0.07376533250013988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,16,balanced,0.07429333527882893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,16,power_law_1.01,0.07094399929046631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,16,power_law_1.01,0.07139840126037597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,16,power_law_1.2,0.07036799788475037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,16,power_law_1.2,0.0710528016090393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,2,balanced,0.34020264943440753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,2,balanced,0.3403306802113851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,2,power_law_1.01,0.2910847902297974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,2,power_law_1.01,0.29764480590820314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,2,power_law_1.2,0.29351680278778075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,2,power_law_1.2,0.29454081058502196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,32,balanced,0.05816000203291575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,32,balanced,0.05829866727193197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,32,power_law_1.01,0.05594879984855652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,32,power_law_1.01,0.05614719986915588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,32,power_law_1.2,0.055244797468185426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,32,power_law_1.2,0.0565887987613678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,4,balanced,0.19795199235280356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,4,balanced,0.199455996354421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,4,power_law_1.01,0.1660863995552063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,4,power_law_1.01,0.17601280212402343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,4,power_law_1.2,0.17010560035705566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,4,power_law_1.2,0.17162879705429077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,64,balanced,0.04643733302752177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,64,balanced,0.04656533400217692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,64,power_law_1.01,0.04538240134716034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,64,power_law_1.01,0.04542079865932465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,64,power_law_1.2,0.045203199982643126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,64,power_law_1.2,0.04520959854125976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,8,balanced,0.12297067046165466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,8,balanced,0.12308800220489502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,8,power_law_1.01,0.10852479934692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,8,power_law_1.01,0.11336959600448608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,8,power_law_1.2,0.11272319555282592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,1,8,power_law_1.2,0.11653120517730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,16,1,balanced,0.2372586727142334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,16,1,balanced,0.2377013365427653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,16,1,power_law_1.01,0.2017728090286255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,16,1,power_law_1.01,0.2059391975402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,16,1,power_law_1.2,0.19946880340576173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,16,1,power_law_1.2,0.20071039199829102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,2,1,balanced,0.3466346661249797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,2,1,balanced,0.34698132673899335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,2,1,power_law_1.01,0.29149439334869387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,2,1,power_law_1.01,0.29159040451049806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,2,1,power_law_1.2,0.2883647918701172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,2,1,power_law_1.2,0.29955201148986815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,32,1,balanced,0.22224533557891846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,32,1,balanced,0.22429333130518594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,32,1,power_law_1.01,0.18680319786071778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,32,1,power_law_1.01,0.18979840278625487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,32,1,power_law_1.2,0.18946559429168702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,32,1,power_law_1.2,0.19233920574188232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,4,1,balanced,0.20756266514460245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,4,1,balanced,0.20890132586161295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,4,1,power_law_1.01,0.17482240200042726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,4,1,power_law_1.01,0.17484159469604493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,4,1,power_law_1.2,0.17450239658355712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,4,1,power_law_1.2,0.17681920528411865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,8,1,balanced,0.3086880048116048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,8,1,balanced,0.30877866347630817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,8,1,power_law_1.01,0.26975359916687014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,8,1,power_law_1.01,0.27068800926208497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,8,1,power_law_1.2,0.2645951986312866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,2688,1856,6,128,8,1,power_law_1.2,0.26749439239501954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,1,balanced,1.1079359849294026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,1,balanced,1.1092747052510579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,1,power_law_1.01,0.8407360076904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,1,power_law_1.01,0.8495871543884277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,1,power_law_1.2,0.8157183647155761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,1,power_law_1.2,0.8387711524963379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,128,balanced,0.04580266773700714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,128,balanced,0.045850664377212524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,128,power_law_1.01,0.04483200013637543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,128,power_law_1.01,0.04492799937725067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,128,power_law_1.2,0.04519039988517761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,128,power_law_1.2,0.04578559994697571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,16,balanced,0.1209440032641093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,16,balanced,0.12186666329701741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,16,power_law_1.01,0.10825599431991577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,16,power_law_1.01,0.11119359731674194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,16,power_law_1.2,0.10057599544525146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,16,power_law_1.2,0.10664960145950317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,2,balanced,0.5794933239618937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,2,balanced,0.5798933506011963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,2,power_law_1.01,0.4648767948150635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,2,power_law_1.01,0.47416319847106936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,2,power_law_1.2,0.46202239990234373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,2,power_law_1.2,0.46832637786865233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,256,balanced,0.04387199878692627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,256,balanced,0.045647998650868736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,256,power_law_1.01,0.042982399463653564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,256,power_law_1.01,0.04310399889945984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,256,power_law_1.2,0.04320000112056732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,256,power_law_1.2,0.04336000084877014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,32,balanced,0.07644266883532207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,32,balanced,0.07644799848397572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,32,power_law_1.01,0.07029119729995728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,32,power_law_1.01,0.07257599830627441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,32,power_law_1.2,0.06848639845848084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,32,power_law_1.2,0.06970880031585694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,4,balanced,0.3164373238881429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,4,balanced,0.32438933849334717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,4,power_law_1.01,0.2620543956756592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,4,power_law_1.01,0.2752255916595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,4,power_law_1.2,0.24273281097412108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,4,power_law_1.2,0.26753280162811277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,64,balanced,0.05821866790453593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,64,balanced,0.058549334605534874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,64,power_law_1.01,0.05414400100708008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,64,power_law_1.01,0.056857597827911374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,64,power_law_1.2,0.05491200089454651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,64,power_law_1.2,0.05495039820671081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,8,balanced,0.18449066082636514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,8,balanced,0.18453333775202432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,8,power_law_1.01,0.15890560150146485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,8,power_law_1.01,0.16666879653930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,8,power_law_1.2,0.14947199821472168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,1,8,power_law_1.2,0.17053439617156982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,16,1,balanced,0.16766933600107828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,16,1,balanced,0.16800532738367716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,16,1,power_law_1.01,0.12519680261611937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,16,1,power_law_1.01,0.12726399898529053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,16,1,power_law_1.2,0.11752959489822387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,16,1,power_law_1.2,0.1205888032913208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,2,1,balanced,0.5859573284784952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,2,1,balanced,0.593946655591329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,2,1,power_law_1.01,0.44185600280761717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,2,1,power_law_1.01,0.45669121742248536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,2,1,power_law_1.2,0.4393919944763184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,2,1,power_law_1.2,0.4412992000579834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,32,1,balanced,0.13481066624323526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,32,1,balanced,0.13525333007176718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,32,1,power_law_1.01,0.10940799713134766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,32,1,power_law_1.01,0.10972800254821777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,32,1,power_law_1.2,0.10760320425033569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,32,1,power_law_1.2,0.10795520544052124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,4,1,balanced,0.3403466542561849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,4,1,balanced,0.3410559892654419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,4,1,power_law_1.01,0.2575103998184204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,4,1,power_law_1.01,0.2595263957977295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,4,1,power_law_1.2,0.2543231964111328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,4,1,power_law_1.2,0.2612096071243286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,8,1,balanced,0.22542933622996011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,8,1,balanced,0.22744532426198324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,8,1,power_law_1.01,0.17059199810028075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,8,1,power_law_1.01,0.1800384044647217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,8,1,power_law_1.2,0.17244160175323486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,3072,1536,8,256,8,1,power_law_1.2,0.17526400089263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,1,balanced,0.4647413492202759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,1,balanced,0.4651840130488078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,1,power_law_1.01,0.5000832080841064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,1,power_law_1.01,0.5173056125640869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,1,power_law_1.2,0.5037055969238281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,1,power_law_1.2,0.5329855918884278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,2,balanced,0.2856373389561971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,2,balanced,0.2874400019645691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,2,power_law_1.01,0.3195264101028442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,2,power_law_1.01,0.33164799213409424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,2,power_law_1.2,0.3029952049255371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,2,power_law_1.2,0.30675840377807617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,4,balanced,0.19117865959803262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,4,balanced,0.20118399461110434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,4,power_law_1.01,0.22491519451141356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,4,power_law_1.01,0.23461759090423584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,4,power_law_1.2,0.2251584053039551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,4,power_law_1.2,0.23141119480133057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,8,balanced,0.13570666313171387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,8,balanced,0.1379146675268809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,8,power_law_1.01,0.17882879972457885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,8,power_law_1.01,0.18225280046463013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,8,power_law_1.2,0.17089279890060424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,1,8,power_law_1.2,0.18049919605255127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,16,1,balanced,0.0584853341182073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,16,1,balanced,0.060032000144322716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,16,1,power_law_1.01,0.062118399143219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,16,1,power_law_1.01,0.06812800168991089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,16,1,power_law_1.2,0.05974400043487549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,16,1,power_law_1.2,0.06381440162658691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,2,1,balanced,0.2513386607170105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,2,1,balanced,0.25547732909520465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,2,1,power_law_1.01,0.2613823890686035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,2,1,power_law_1.01,0.2717056035995483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,2,1,power_law_1.2,0.2793920040130615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,2,1,power_law_1.2,0.2804608106613159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,32,1,balanced,0.045519997676213585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,32,1,balanced,0.04751466711362203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,32,1,power_law_1.01,0.044588801264762876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,32,1,power_law_1.01,0.04624640047550201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,32,1,power_law_1.2,0.04583039879798889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,32,1,power_law_1.2,0.04652160108089447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,4,1,balanced,0.1458293298880259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,4,1,balanced,0.14917866388956705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,4,1,power_law_1.01,0.14421119689941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,4,1,power_law_1.01,0.15126399993896483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,4,1,power_law_1.2,0.14565119743347169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,4,1,power_law_1.2,0.15181440114974976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,8,1,balanced,0.09693333506584167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,8,1,balanced,0.09795733292897542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,8,1,power_law_1.01,0.08472959995269776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,8,1,power_law_1.01,0.08542720079421998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,8,1,power_law_1.2,0.08427519798278808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,14336,2,8,8,1,power_law_1.2,0.0877120018005371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,1,balanced,0.7616639931996664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,1,balanced,0.7659839789072672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,1,power_law_1.01,0.689631986618042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,1,power_law_1.01,0.7021759986877442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,1,power_law_1.2,0.7015232086181641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,1,power_law_1.2,0.7123007774353027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,128,balanced,0.04584533472855886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,128,balanced,0.04597333570321401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,128,power_law_1.01,0.045491200685501096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,128,power_law_1.01,0.04552319943904877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,128,power_law_1.2,0.04565120041370392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,128,power_law_1.2,0.04601599872112274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,16,balanced,0.090421328941981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,16,balanced,0.09064533313115437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,16,power_law_1.01,0.08340479731559754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,16,power_law_1.01,0.08819199800491333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,16,power_law_1.2,0.08564479947090149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,16,power_law_1.2,0.08598399758338929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,2,balanced,0.41419732570648193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,2,balanced,0.41606398423512775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,2,power_law_1.01,0.3749759912490845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,2,power_law_1.01,0.37528960704803466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,2,power_law_1.2,0.3743423938751221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,2,power_law_1.2,0.392524790763855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,32,balanced,0.06604800124963124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,32,balanced,0.06791466474533081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,32,power_law_1.01,0.06584320068359376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,32,power_law_1.01,0.06606720089912414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,32,power_law_1.2,0.06469759941101075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,32,power_law_1.2,0.06557440161705017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,4,balanced,0.23271467288335165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,4,balanced,0.23559466997782388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,4,power_law_1.01,0.22305920124053955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,4,power_law_1.01,0.2232448101043701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,4,power_law_1.2,0.21633920669555665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,4,power_law_1.2,0.22618238925933837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,64,balanced,0.05198400219281515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,64,balanced,0.05382933219273885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,64,power_law_1.01,0.04924159944057464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,64,power_law_1.01,0.049779200553894044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,64,power_law_1.2,0.05025920271873474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,64,power_law_1.2,0.05289599895477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,8,balanced,0.1456160048643748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,8,balanced,0.15082666277885437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,8,power_law_1.01,0.13880959749221802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,8,power_law_1.01,0.1443711996078491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,8,power_law_1.2,0.14097280502319337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,1,8,power_law_1.2,0.14375679492950438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,16,1,balanced,0.11521599690119426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,16,1,balanced,0.11539733409881592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,16,1,power_law_1.01,0.10582400560379028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,16,1,power_law_1.01,0.10704640150070191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,16,1,power_law_1.2,0.10743680000305175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,16,1,power_law_1.2,0.11052160263061524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,2,1,balanced,0.38656000296274823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,2,1,balanced,0.38845332463582355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,2,1,power_law_1.01,0.342630410194397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,2,1,power_law_1.01,0.34652159214019773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,2,1,power_law_1.2,0.3539328098297119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,2,1,power_law_1.2,0.35540480613708497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,32,1,balanced,0.10292266805966695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,32,1,balanced,0.1032960017522176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,32,1,power_law_1.01,0.09581440091133117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,32,1,power_law_1.01,0.09648000001907349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,32,1,power_law_1.2,0.09639040231704712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,32,1,power_law_1.2,0.0981760025024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,4,1,balanced,0.24450133244196573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,4,1,balanced,0.24490666389465332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,4,1,power_law_1.01,0.23180160522460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,4,1,power_law_1.01,0.23182079792022706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,4,1,power_law_1.2,0.23179519176483154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,4,1,power_law_1.2,0.2382591962814331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,8,1,balanced,0.17324799299240112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,8,1,balanced,0.17561600605646768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,8,1,power_law_1.01,0.1577855944633484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,8,1,power_law_1.01,0.1607743978500366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,8,1,power_law_1.2,0.15982719659805297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,1536,8,128,8,1,power_law_1.2,0.16530560255050658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,1,balanced,5.257877349853516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,1,balanced,5.3393815358479815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,1,power_law_1.01,4.090643310546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,1,power_law_1.01,4.2209217071533205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,1,power_law_1.2,4.123455810546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,1,power_law_1.2,4.282745742797852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,128,balanced,0.11934933066368103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,128,balanced,0.12177067001660664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,128,power_law_1.01,0.11891839504241944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,128,power_law_1.01,0.11909760236740112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,128,power_law_1.2,0.11875200271606445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,128,power_law_1.2,0.11968640089035035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,16,balanced,0.39795732498168945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,16,balanced,0.39952532450358075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,16,power_law_1.01,0.356710410118103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,16,power_law_1.01,0.36469759941101076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,16,power_law_1.2,0.3621376037597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,16,power_law_1.2,0.3785343885421753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,2,balanced,2.5592800776163735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,2,balanced,2.718384106953939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,2,power_law_1.01,2.0715328216552735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,2,power_law_1.01,2.1760704040527346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,2,power_law_1.2,2.102124786376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,2,power_law_1.2,2.160038375854492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,256,balanced,0.1018453339735667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,256,balanced,0.10310399532318115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,256,power_law_1.01,0.10005120038986207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,256,power_law_1.01,0.1000704050064087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,256,power_law_1.2,0.10043519735336304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,256,power_law_1.2,0.10063999891281128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,32,balanced,0.2464746634165446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,32,balanced,0.2480693260828654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,32,power_law_1.01,0.22328319549560546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,32,power_law_1.01,0.22707200050354004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,32,power_law_1.2,0.22651519775390624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,32,power_law_1.2,0.23096320629119874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,4,balanced,1.3068532943725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,4,balanced,1.3102773030598958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,4,power_law_1.01,1.173145580291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,4,power_law_1.01,1.2210880279541017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,4,power_law_1.2,1.1136832237243652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,4,power_law_1.2,1.1416319847106933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,64,balanced,0.16977600256601968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,64,balanced,0.17299199104309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,64,power_law_1.01,0.1518272042274475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,64,power_law_1.01,0.15453439950942993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,64,power_law_1.2,0.16090240478515624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,64,power_law_1.2,0.16510080099105834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,8,balanced,0.7072479724884033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,8,power_law_1.01,0.626803207397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,8,power_law_1.01,0.6395135879516601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,8,power_law_1.2,0.6122176170349121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,1,8,power_law_1.2,0.6148032188415528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,16,1,balanced,1.5757652918497722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,16,1,balanced,1.5768639246622722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,16,1,power_law_1.01,1.2980095863342285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,16,1,power_law_1.01,1.3158271789550782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,16,1,power_law_1.2,1.290988826751709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,16,1,power_law_1.2,1.2991935729980468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,2,1,balanced,2.445669333140055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,2,1,balanced,2.451493263244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,2,1,power_law_1.01,2.025587272644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,2,1,power_law_1.01,2.025823974609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,2,1,power_law_1.2,1.9798463821411132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,2,1,power_law_1.2,2.0091968536376954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,32,1,balanced,1.2682507038116455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,32,1,balanced,1.271114667256673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,32,1,power_law_1.01,1.0455167770385743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,32,1,power_law_1.01,1.0568256378173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,32,1,power_law_1.2,1.0435903549194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,32,1,power_law_1.2,1.0476479530334473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,4,1,balanced,1.3910667101542156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,4,1,balanced,1.392800013224284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,4,1,power_law_1.01,1.1542719841003417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,4,1,power_law_1.01,1.1711104393005372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,4,1,power_law_1.2,1.1548095703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,4,1,power_law_1.2,1.1695167541503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,8,1,balanced,0.8010559876759847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,8,1,balanced,0.8012426694234213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,8,1,power_law_1.01,0.6636159896850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,8,1,power_law_1.01,0.6737088203430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,8,1,power_law_1.2,0.6542912006378174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,4096,2688,22,512,8,1,power_law_1.2,0.6631231784820557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,1,balanced,0.7977173328399658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,1,balanced,0.8008533318837484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,1,power_law_1.01,0.8359359741210938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,1,power_law_1.01,0.9013504028320313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,1,power_law_1.2,0.8417920112609864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,1,power_law_1.2,0.8585280418395996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,2,balanced,0.4380106528600057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,2,balanced,0.46264533201853436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,2,power_law_1.01,0.4843776226043701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,2,power_law_1.01,0.4891647815704346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,2,power_law_1.2,0.4966720104217529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,2,power_law_1.2,0.5114751815795898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,4,balanced,0.2488266626993815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,4,balanced,0.2512906591097514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,4,power_law_1.01,0.3268480062484741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,4,power_law_1.01,0.34344959259033203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,4,power_law_1.2,0.31048319339752195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,4,power_law_1.2,0.38517758846282957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,8,balanced,0.16851733128229776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,8,balanced,0.17076265811920166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,8,power_law_1.01,0.2348543882369995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,8,power_law_1.01,0.23571200370788575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,8,power_law_1.2,0.23619840145111085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,1,8,power_law_1.2,0.237555193901062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,16,1,balanced,0.08370133241017659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,16,1,balanced,0.08396800359090169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,16,1,power_law_1.01,0.08398720026016235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,16,1,power_law_1.01,0.09159039855003356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,16,1,power_law_1.2,0.08867200016975403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,16,1,power_law_1.2,0.09021440148353577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,2,1,balanced,0.43093331654866535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,2,1,balanced,0.4466773271560669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,2,1,power_law_1.01,0.450867223739624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,2,1,power_law_1.01,0.45235838890075686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,2,1,power_law_1.2,0.43934078216552735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,2,1,power_law_1.2,0.44911999702453614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,32,1,balanced,0.06471999982992808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,32,1,balanced,0.06613333523273468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,32,1,power_law_1.01,0.06478080153465271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,32,1,power_law_1.01,0.06828799843788147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,32,1,power_law_1.2,0.0646016001701355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,32,1,power_law_1.2,0.06787199974060058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,4,1,balanced,0.2315839926401774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,4,1,balanced,0.2472533384958903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,4,1,power_law_1.01,0.23125760555267333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,4,1,power_law_1.01,0.24637439250946044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,4,1,power_law_1.2,0.23047680854797364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,4,1,power_law_1.2,0.2425407886505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,8,1,balanced,0.12779733538627625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,8,1,balanced,0.1421440045038859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,8,1,power_law_1.01,0.13415679931640626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,8,1,power_law_1.01,0.13778560161590575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,8,1,power_law_1.2,0.1410048007965088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,16384,2,8,8,1,power_law_1.2,0.14165760278701783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,1,balanced,2.8258934020996094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,1,balanced,3.0172106424967446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,1,power_law_1.01,2.1227840423583983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,1,power_law_1.01,2.13177604675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,1,power_law_1.2,2.1081472396850587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,1,power_law_1.2,2.144281578063965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,128,balanced,0.086709330479304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,128,balanced,0.08708266417185466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,128,power_law_1.01,0.0843775987625122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,128,power_law_1.01,0.08499199748039246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,128,power_law_1.2,0.08458240032196045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,128,power_law_1.2,0.08463360071182251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,16,balanced,0.23373866081237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,16,balanced,0.23388266563415527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,16,power_law_1.01,0.21763839721679687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,16,power_law_1.01,0.22243199348449708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,16,power_law_1.2,0.22492799758911133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,16,power_law_1.2,0.22939519882202147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,2,balanced,1.4316587448120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,2,balanced,1.4762773513793945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,2,power_law_1.01,1.116102409362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,2,power_law_1.01,1.184774398803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,2,power_law_1.2,1.0810751914978027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,2,power_law_1.2,1.0811200141906738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,256,balanced,0.07032000025113423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,256,balanced,0.07344533503055573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,256,power_law_1.01,0.06941440105438232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,256,power_law_1.01,0.07151359915733338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,256,power_law_1.2,0.06937599778175355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,256,power_law_1.2,0.07109119892120361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,32,balanced,0.1402186652024587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,32,balanced,0.141594668229421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,32,power_law_1.01,0.13411840200424194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,32,power_law_1.01,0.1373247981071472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,32,power_law_1.2,0.13270399570465088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,32,power_law_1.2,0.1346943974494934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,4,balanced,0.74507737159729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,4,balanced,0.7465013662974039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,4,power_law_1.01,0.6222271919250488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,4,power_law_1.01,0.6601791858673096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,4,power_law_1.2,0.6362815856933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,4,power_law_1.2,0.6888448238372803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,64,balanced,0.10528533657391866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,64,balanced,0.10717866818110149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,64,power_law_1.01,0.10102399587631225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,64,power_law_1.01,0.10346239805221558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,64,power_law_1.2,0.09467520117759705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,64,power_law_1.2,0.10359679460525513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,8,balanced,0.42128535111745197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,8,balanced,0.4243786732355754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,8,power_law_1.01,0.36535680294036865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,8,power_law_1.01,0.37608320713043214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,8,power_law_1.2,0.32058238983154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,1,8,power_law_1.2,0.38670079708099364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,16,1,balanced,0.3098026712735494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,16,1,balanced,0.31016000111897785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,16,1,power_law_1.01,0.26229760646820066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,16,1,power_law_1.01,0.26302080154418944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,16,1,power_law_1.2,0.2584575891494751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,16,1,power_law_1.2,0.26023039817810056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,2,1,balanced,1.4581440289815266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,2,1,balanced,1.4907946586608887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,2,1,power_law_1.01,1.1227840423583983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,2,1,power_law_1.01,1.141932773590088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,2,1,power_law_1.2,1.071833610534668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,2,1,power_law_1.2,1.103872013092041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,32,1,balanced,0.24407466252644858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,32,1,balanced,0.24566400051116943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,32,1,power_law_1.01,0.19243520498275757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,32,1,power_law_1.01,0.19684480428695678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,32,1,power_law_1.2,0.1922943949699402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,32,1,power_law_1.2,0.19281280040740967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,4,1,balanced,0.7783892949422201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,4,1,balanced,0.779151995976766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,4,1,power_law_1.01,0.6108416080474853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,4,1,power_law_1.01,0.6240896224975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,4,1,power_law_1.2,0.5913280010223388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,4,1,power_law_1.2,0.5934656143188477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,8,1,balanced,0.4804106553395589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,8,1,balanced,0.4816853205362956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,8,1,power_law_1.01,0.36688640117645266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,8,1,power_law_1.01,0.37036159038543703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,8,1,power_law_1.2,0.3667007923126221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2048,8,256,8,1,power_law_1.2,0.368889594078064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,1,balanced,2.2314720153808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,1,balanced,2.236117362976074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,1,power_law_1.01,1.8734912872314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,1,power_law_1.01,1.9252992630004884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,1,power_law_1.2,1.8815807342529296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,1,power_law_1.2,1.9113664627075195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,16,balanced,0.20196799437204996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,16,balanced,0.20850666364034018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,16,power_law_1.01,0.19434239864349365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,16,power_law_1.01,0.1982591986656189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,16,power_law_1.2,0.18455679416656495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,16,power_law_1.2,0.18932479619979858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,2,balanced,1.1312426726023357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,2,balanced,1.1314079761505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,2,power_law_1.01,0.9697471618652344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,2,power_law_1.01,0.9850560188293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,2,power_law_1.2,0.9520319938659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,2,power_law_1.2,0.9983936309814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,32,balanced,0.121888001759847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,32,balanced,0.1222773293654124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,32,power_law_1.01,0.1130687952041626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,32,power_law_1.01,0.11679999828338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,32,power_law_1.2,0.11715840101242066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,32,power_law_1.2,0.11719679832458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,4,balanced,0.6112106641133627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,4,balanced,0.6145386695861816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,4,power_law_1.01,0.514470386505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,4,power_law_1.01,0.5346240043640137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,4,power_law_1.2,0.5417920112609863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,4,power_law_1.2,0.5445888042449951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,8,balanced,0.3313759962717692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,8,balanced,0.3320266604423523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,8,power_law_1.01,0.304582405090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,8,power_law_1.01,0.3088128089904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,8,power_law_1.2,0.30531840324401854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,1,8,power_law_1.2,0.3090559959411621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,16,1,balanced,0.277349332968394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,16,1,balanced,0.2797759970029195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,16,1,power_law_1.01,0.24179840087890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,16,1,power_law_1.01,0.2439039945602417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,16,1,power_law_1.2,0.2462912082672119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,16,1,power_law_1.2,0.2465343952178955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,2,1,balanced,1.1325120131174724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,2,1,balanced,1.1357759634653728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,2,1,power_law_1.01,0.9564864158630371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,2,1,power_law_1.01,0.9635519981384277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,2,1,power_law_1.2,0.9873984336853028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,2,1,power_law_1.2,0.9990079879760743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,32,1,balanced,0.1844159960746765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,32,1,balanced,0.185370663801829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,32,1,power_law_1.01,0.16210559606552125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,32,1,power_law_1.01,0.16539520025253296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,32,1,power_law_1.2,0.1663807988166809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,32,1,power_law_1.2,0.16680959463119507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,4,1,balanced,0.6314186652501425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,4,1,balanced,0.6375573476155599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,4,1,power_law_1.01,0.5311679840087891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,4,1,power_law_1.01,0.5377280235290527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,4,1,power_law_1.2,0.5324927806854248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,4,1,power_law_1.2,0.5367616176605224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,8,1,balanced,0.3745493491490682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,8,1,balanced,0.37566399574279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,8,1,power_law_1.01,0.3399359941482544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,8,1,power_law_1.01,0.3418175935745239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,8,1,power_law_1.2,0.3425600051879883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,6144,2560,8,160,8,1,power_law_1.2,0.3455552101135254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,1,balanced,3.357013384501139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,1,balanced,3.3590879440307617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,1,power_law_1.01,2.462272071838379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,1,power_law_1.01,2.510406494140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,1,power_law_1.2,2.424569511413574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,1,power_law_1.2,2.465171241760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,128,balanced,0.09709333380063374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,128,balanced,0.097461332877477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,128,power_law_1.01,0.09461119771003723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,128,power_law_1.01,0.09492480158805847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,128,power_law_1.2,0.09473919868469238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,128,power_law_1.2,0.0950976014137268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,16,balanced,0.26946133375167847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,16,balanced,0.2749706705411275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,16,power_law_1.01,0.24820480346679688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,16,power_law_1.01,0.25557119846343995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,16,power_law_1.2,0.24512639045715331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,16,power_law_1.2,0.2575743913650513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,2,balanced,1.6915520032246907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,2,balanced,1.7375359535217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,2,power_law_1.01,1.3457856178283691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,2,power_law_1.01,1.3668671607971192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,2,power_law_1.2,1.3272192001342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,2,power_law_1.2,1.3528639793395996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,256,balanced,0.08240533371766408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,256,balanced,0.08291199803352356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,256,power_law_1.01,0.08090879917144775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,256,power_law_1.01,0.08280320167541504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,256,power_law_1.2,0.07934719920158387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,256,power_law_1.2,0.08166400194168091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,32,balanced,0.15847466389338175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,32,balanced,0.1590079963207245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,32,power_law_1.01,0.15367679595947265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,32,power_law_1.01,0.1539072036743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,32,power_law_1.2,0.15140479803085327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,32,power_law_1.2,0.15404800176620484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,4,balanced,0.8631839752197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,4,balanced,0.8645599683125814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,4,power_law_1.01,0.6855999946594238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,4,power_law_1.01,0.7351359844207763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,4,power_law_1.2,0.6914239883422851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,4,power_law_1.2,0.7371071815490723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,64,balanced,0.11994666854540507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,64,balanced,0.1213653286298116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,64,power_law_1.01,0.11479040384292602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,64,power_law_1.01,0.11728639602661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,64,power_law_1.2,0.11123839616775513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,64,power_law_1.2,0.1140671968460083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,8,balanced,0.4885760148366292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,8,balanced,0.4954933325449626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,8,power_law_1.01,0.3949631929397583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,8,power_law_1.01,0.43038082122802734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,8,power_law_1.2,0.39491839408874513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,1,8,power_law_1.2,0.42169599533081054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,16,1,balanced,0.3559573491414388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,16,1,balanced,0.3579839865366618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,16,1,power_law_1.01,0.30304000377655027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,16,1,power_law_1.01,0.30361599922180177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,16,1,power_law_1.2,0.29863040447235106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,16,1,power_law_1.2,0.3070080041885376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,2,1,balanced,1.7099253336588542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,2,1,balanced,1.736080010732015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,2,1,power_law_1.01,1.2969087600708007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,2,1,power_law_1.01,1.3171008110046387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,2,1,power_law_1.2,1.2805376052856445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,2,1,power_law_1.2,1.3147071838378905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,32,1,balanced,0.2796799937884013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,32,1,balanced,0.2815946737925212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,32,1,power_law_1.01,0.2207360029220581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,32,1,power_law_1.01,0.2219775915145874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,32,1,power_law_1.2,0.21984639167785644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,32,1,power_law_1.2,0.22724480628967286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,4,1,balanced,0.9026133219401041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,4,1,balanced,0.9182720184326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,4,1,power_law_1.01,0.7041984081268311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,4,1,power_law_1.01,0.7288000106811523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,4,1,power_law_1.2,0.7016191959381104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,4,1,power_law_1.2,0.7062784194946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,8,1,balanced,0.5581813255945841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,8,1,balanced,0.5595733324686686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,8,1,power_law_1.01,0.43079681396484376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,8,1,power_law_1.01,0.4315904140472412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,8,1,power_law_1.2,0.4255360126495361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,256,8,1,power_law_1.2,0.4276864051818848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,1,balanced,4.943338712056478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,1,balanced,5.451744079589844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,1,power_law_1.01,3.272467041015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,1,power_law_1.01,3.2843582153320314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,1,power_law_1.2,3.1883264541625977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,1,power_law_1.2,3.213292694091797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,128,balanced,0.11123200257619222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,128,balanced,0.11311999956766765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,128,power_law_1.01,0.10968320369720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,128,power_law_1.01,0.1102336049079895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,128,power_law_1.2,0.10925439596176148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,128,power_law_1.2,0.10981760025024415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,16,balanced,0.3863786856333415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,16,balanced,0.3880639870961507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,16,power_law_1.01,0.3525248050689697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,16,power_law_1.01,0.3608128070831299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,16,power_law_1.2,0.31985280513763426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,16,power_law_1.2,0.3266495943069458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,2,balanced,2.573088010152181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,2,balanced,2.5955840746561685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,2,power_law_1.01,1.7856063842773438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,2,power_law_1.01,1.8010623931884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,2,power_law_1.2,1.7374784469604492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,2,power_law_1.2,1.7428543090820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,32,balanced,0.24714134136835733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,32,balanced,0.24734934171040854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,32,power_law_1.01,0.21829121112823485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,32,power_law_1.01,0.2301055908203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,32,power_law_1.2,0.2040895938873291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,32,power_law_1.2,0.20906879901885986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,4,balanced,1.2845333417256672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,4,balanced,1.2860639890034993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,4,power_law_1.01,0.9692159652709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,4,power_law_1.01,1.1461119651794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,4,power_law_1.2,0.9743935585021972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,4,power_law_1.2,1.0471551895141602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,64,balanced,0.1546026666959127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,64,balanced,0.15537066260973612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,64,power_law_1.01,0.13623679876327516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,64,power_law_1.01,0.14426239728927612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,64,power_law_1.2,0.14131840467453002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,64,power_law_1.2,0.14916479587554932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,8,balanced,0.6951306660970052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,8,balanced,0.696074644724528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,8,power_law_1.01,0.5760447978973389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,8,power_law_1.01,0.6606719970703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,8,power_law_1.2,0.6455423831939697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,1,8,power_law_1.2,0.6777535915374756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,16,1,balanced,0.5227466821670532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,16,1,balanced,0.5228426853815714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,16,1,power_law_1.01,0.3634239912033081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,16,1,power_law_1.01,0.3656320095062256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,16,1,power_law_1.2,0.3537856101989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,16,1,power_law_1.2,0.3575360059738159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,2,1,balanced,2.6044480005900064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,2,1,balanced,2.622741381327311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,2,1,power_law_1.01,1.6860416412353516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,2,1,power_law_1.01,1.7139392852783204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,2,1,power_law_1.2,1.662131118774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,2,1,power_law_1.2,1.6783744812011718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,32,1,balanced,0.4301226536432902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,32,1,balanced,0.43518932660420734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,32,1,power_law_1.01,0.2844928026199341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,32,1,power_law_1.01,0.2881088018417358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,32,1,power_law_1.2,0.2791424036026001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,32,1,power_law_1.2,0.2793920040130615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,4,1,balanced,1.3493332862854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,4,1,balanced,1.3523732821146648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,4,1,power_law_1.01,0.918336009979248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,4,1,power_law_1.01,0.9198080062866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,4,1,power_law_1.2,0.8778495788574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,4,1,power_law_1.2,0.8943231582641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,8,1,balanced,0.8049759864807129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,8,1,balanced,0.8053173224131266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,8,1,power_law_1.01,0.5598976135253906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,8,1,power_law_1.01,0.5647488117218018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,8,1,power_law_1.2,0.5472256183624268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,64,7168,2048,8,384,8,1,power_law_1.2,0.5526591777801514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,1,balanced,0.25685866673787433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,1,balanced,0.2578879992167155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,1,power_law_1.01,0.2797951936721802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,1,power_law_1.01,0.2848320007324219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,1,power_law_1.2,0.2841088056564331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,1,power_law_1.2,0.28641281127929685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,128,balanced,0.07037333150704701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,128,balanced,0.07049599786599477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,128,power_law_1.01,0.07238399982452393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,128,power_law_1.01,0.07347840070724487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,128,power_law_1.2,0.07516800165176392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,128,power_law_1.2,0.07771520018577575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,16,balanced,0.08724266290664673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,16,balanced,0.08893332878748576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,16,power_law_1.01,0.08782079815864563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,16,power_law_1.01,0.0883520007133484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,16,power_law_1.2,0.09071999788284302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,2,balanced,0.1888320048650106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,2,balanced,0.19262933731079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,2,power_law_1.01,0.1987712025642395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,2,power_law_1.01,0.20279040336608886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,2,power_law_1.2,0.2035968065261841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,2,power_law_1.2,0.20880000591278075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,32,balanced,0.07765866816043854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,32,balanced,0.07931733131408691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,32,power_law_1.01,0.07991039752960205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,32,power_law_1.01,0.08001919984817504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,32,power_law_1.2,0.08047360181808472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,32,power_law_1.2,0.08384000062942505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,4,balanced,0.13564800222714743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,4,balanced,0.13621333241462708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,4,power_law_1.01,0.13753600120544435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,4,power_law_1.01,0.13898240327835082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,4,power_law_1.2,0.14028799533843994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,4,power_law_1.2,0.14071040153503417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,64,balanced,0.07308800021807353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,64,balanced,0.0746559997399648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,64,power_law_1.01,0.07333760261535645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,64,power_law_1.01,0.07539839744567871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,64,power_law_1.2,0.0767359972000122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,64,power_law_1.2,0.07676799893379212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,8,balanced,0.1000426709651947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,8,balanced,0.10107200344403584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,8,power_law_1.01,0.10536960363388062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,8,power_law_1.01,0.10595840215682983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,8,power_law_1.2,0.10679039955139161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,1,8,power_law_1.2,0.11230080127716065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,2,1,balanced,0.18056533734003702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,2,1,balanced,0.18167465925216675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,2,1,power_law_1.01,0.18133759498596191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,2,1,power_law_1.01,0.18599679470062255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,2,1,power_law_1.2,0.1977280020713806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,2,1,power_law_1.2,0.19788800477981566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,4,1,balanced,0.13151466846466064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,4,1,balanced,0.13154666622479758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,4,1,power_law_1.01,0.13502720594406128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,4,1,power_law_1.01,0.13537919521331787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,4,1,power_law_1.2,0.1371840000152588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2048,768,8,128,4,1,power_law_1.2,0.1373311996459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,1,balanced,0.6717226505279541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,1,balanced,0.6817653179168701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,1,power_law_1.01,0.6993023872375488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,1,power_law_1.01,0.7065792083740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,1,power_law_1.2,0.7233920097351074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,1,power_law_1.2,0.7322879791259765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,128,balanced,0.09807466467221577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,128,balanced,0.10081066687901814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,128,power_law_1.01,0.10041600465774536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,128,power_law_1.01,0.10167039632797241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,128,power_law_1.2,0.10224000215530396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,128,power_law_1.2,0.10377600193023681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,16,balanced,0.13596266508102417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,16,balanced,0.1362506647904714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,16,power_law_1.01,0.1463744044303894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,16,power_law_1.2,0.15362559556961058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,16,power_law_1.2,0.15423359870910644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,2,balanced,0.44310931364695233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,2,balanced,0.44341333707173664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,2,power_law_1.01,0.4488639831542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,2,power_law_1.01,0.46381440162658694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,2,power_law_1.2,0.45681281089782716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,2,power_law_1.2,0.4696512222290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,32,balanced,0.11346667011578877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,32,balanced,0.1141973336537679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,32,power_law_1.01,0.1176576018333435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,32,power_law_1.01,0.11956479549407958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,32,power_law_1.2,0.1207360029220581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,32,power_law_1.2,0.12215039730072022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,4,balanced,0.27400000890096027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,4,balanced,0.2752319971720378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,4,power_law_1.01,0.2718656063079834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,4,power_law_1.01,0.2758143901824951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,4,power_law_1.2,0.2790208101272583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,4,power_law_1.2,0.2827647924423218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,64,balanced,0.10325866937637329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,64,balanced,0.10481066505114238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,64,power_law_1.01,0.10791679620742797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,64,power_law_1.01,0.10854400396347046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,64,power_law_1.2,0.1110975980758667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,64,power_law_1.2,0.11148159503936768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,8,balanced,0.1857866644859314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,8,balanced,0.1867146690686544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,8,power_law_1.01,0.1920192003250122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,8,power_law_1.01,0.1938688039779663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,8,power_law_1.2,0.19163520336151124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,1,8,power_law_1.2,0.1936511993408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,16,1,balanced,0.2694666584332784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,16,1,balanced,0.2709280053774516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,16,1,power_law_1.01,0.276147198677063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,16,1,power_law_1.01,0.27762560844421386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,16,1,power_law_1.2,0.28256640434265134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,16,1,power_law_1.2,0.28419198989868166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,2,1,balanced,0.4347999890645345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,2,1,balanced,0.434928019841512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,2,1,power_law_1.01,0.43061118125915526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,2,1,power_law_1.01,0.4314752101898193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,2,1,power_law_1.2,0.4459072113037109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,2,1,power_law_1.2,0.45499520301818847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,32,1,balanced,0.21585599581400552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,32,1,balanced,0.21656533082326254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,32,1,power_law_1.01,0.22284159660339356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,32,1,power_law_1.01,0.22410240173339843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,32,1,power_law_1.2,0.22961280345916749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,32,1,power_law_1.2,0.2297152042388916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,4,1,balanced,0.26495466629664105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,4,1,balanced,0.2658986647923787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,4,1,power_law_1.01,0.26562559604644775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,4,1,power_law_1.01,0.2656831979751587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,4,1,power_law_1.2,0.26890881061553956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,4,1,power_law_1.2,0.27036800384521487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,8,1,balanced,0.3539946476618449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,8,1,balanced,0.3553493420283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,8,1,power_law_1.01,0.3650496006011963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,8,1,power_law_1.01,0.36510720252990725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,8,1,power_law_1.2,0.37404799461364746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,2688,1856,6,128,8,1,power_law_1.2,0.37431039810180666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,1,balanced,1.3938560485839844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,1,balanced,1.4428693453470867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,1,power_law_1.01,1.2872703552246094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,1,power_law_1.01,1.294713592529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,1,power_law_1.2,1.3467519760131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,1,power_law_1.2,1.3819199562072755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,128,balanced,0.13994133472442627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,128,balanced,0.14017599821090698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,128,power_law_1.01,0.14152319431304933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,128,power_law_1.01,0.1415743947029114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,128,power_law_1.2,0.1428287982940674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,128,power_law_1.2,0.14365439414978026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,16,balanced,0.21701333920160928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,16,balanced,0.21785066525141397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,16,power_law_1.01,0.21621758937835694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,16,power_law_1.01,0.2179840087890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,16,power_law_1.2,0.21855359077453612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,16,power_law_1.2,0.21993598937988282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,2,balanced,0.7699626286824545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,2,balanced,0.771888017654419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,2,power_law_1.01,0.7148416042327881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,2,power_law_1.01,0.7451200008392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,2,power_law_1.2,0.7392831802368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,2,power_law_1.2,0.7584959983825683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,256,balanced,0.1341386636098226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,256,balanced,0.13530133167902628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,256,power_law_1.01,0.13735040426254272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,256,power_law_1.01,0.13806079626083373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,256,power_law_1.2,0.13805439472198486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,256,power_law_1.2,0.13904639482498168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,32,balanced,0.1707893411318461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,32,balanced,0.17083199818929037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,32,power_law_1.01,0.1699903964996338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,32,power_law_1.01,0.17441920042037964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,32,power_law_1.2,0.17527040243148803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,32,power_law_1.2,0.17567360401153564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,4,balanced,0.4599519968032837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,4,balanced,0.4613120158513387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,4,power_law_1.01,0.43245439529418944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,4,power_law_1.01,0.44231038093566893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,4,power_law_1.2,0.4489408016204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,4,power_law_1.2,0.45844478607177735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,64,balanced,0.14958932995796204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,64,balanced,0.14966932932535806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,64,power_law_1.01,0.15054719448089598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,64,power_law_1.01,0.15134079456329347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,64,power_law_1.2,0.1521664023399353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,64,power_law_1.2,0.15562880039215088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,8,balanced,0.29739199082056683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,8,balanced,0.29841067393620807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,8,power_law_1.01,0.2883008003234863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,8,power_law_1.01,0.2896960020065308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,8,power_law_1.2,0.2966079950332642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,1,8,power_law_1.2,0.30531198978424073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,16,1,balanced,0.22426132361094156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,16,1,balanced,0.2254026730855306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,16,1,power_law_1.01,0.2165247917175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,16,1,power_law_1.01,0.21799039840698242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,16,1,power_law_1.2,0.22169599533081055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,16,1,power_law_1.2,0.22451200485229492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,2,1,balanced,0.7579039732615153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,2,1,balanced,0.7581706841786703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,2,1,power_law_1.01,0.7015039920806885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,2,1,power_law_1.01,0.7035200119018554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,2,1,power_law_1.2,0.7440896034240723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,2,1,power_law_1.2,0.7519296169281006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,32,1,balanced,0.17504000663757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,32,1,balanced,0.17654399077097574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,32,1,power_law_1.01,0.17176320552825927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,32,1,power_law_1.01,0.17230720520019532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,32,1,power_law_1.2,0.17550079822540282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,32,1,power_law_1.2,0.1759935975074768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,4,1,balanced,0.44815464814503986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,4,1,balanced,0.44898664951324463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,4,1,power_law_1.01,0.40826878547668455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,4,1,power_law_1.01,0.41709442138671876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,4,1,power_law_1.2,0.4423359870910645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,4,1,power_law_1.2,0.4457727909088135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,8,1,balanced,0.28758400678634644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,8,1,balanced,0.28781867027282715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,8,1,power_law_1.01,0.278438401222229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,8,1,power_law_1.01,0.2796992063522339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,8,1,power_law_1.2,0.281439995765686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,3072,1536,8,256,8,1,power_law_1.2,0.28190720081329346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,1,balanced,1.01255464553833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,1,balanced,1.0190506776173909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,1,power_law_1.01,1.0531904220581054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,1,power_law_1.01,1.054092788696289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,1,power_law_1.2,1.0892864227294923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,1,power_law_1.2,1.0965312004089356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,2,balanced,0.5225653251012167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,2,balanced,0.5246346791585287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,2,power_law_1.01,0.5704703807830811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,2,power_law_1.01,0.6970687866210937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,2,power_law_1.2,0.6571519851684571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,2,power_law_1.2,0.6646463871002197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,4,balanced,0.37253332138061523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,4,balanced,0.3747573296229045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,4,power_law_1.01,0.43495678901672363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,4,power_law_1.01,0.5025792121887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,4,power_law_1.2,0.4622464179992676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,4,power_law_1.2,0.465561580657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,8,balanced,0.3027946750322978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,8,balanced,0.3028266628583272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,8,power_law_1.01,0.3780352115631104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,8,power_law_1.01,0.38574719429016113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,8,power_law_1.2,0.3972223997116089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,1,8,power_law_1.2,0.39816319942474365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,16,1,balanced,0.09727467099825542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,16,1,balanced,0.09730666875839233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,16,1,power_law_1.01,0.09761279821395874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,16,1,power_law_1.01,0.09813759922981262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,16,1,power_law_1.2,0.09702399969100953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,16,1,power_law_1.2,0.09770879745483399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,2,1,balanced,0.5050026575724283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,2,1,balanced,0.5081813335418701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,2,1,power_law_1.01,0.5106624126434326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,2,1,power_law_1.01,0.52291841506958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,2,1,power_law_1.2,0.5154751777648926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,2,1,power_law_1.2,0.523302412033081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,32,1,balanced,0.08102933565775554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,32,1,balanced,0.0820906658967336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,32,1,power_law_1.01,0.08158079981803894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,32,1,power_law_1.01,0.08173440098762512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,32,1,power_law_1.2,0.0813759982585907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,32,1,power_law_1.2,0.08145920038223267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,4,1,balanced,0.2766186594963074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,4,1,balanced,0.27712533871332806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,4,1,power_law_1.01,0.27721600532531737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,4,1,power_law_1.01,0.2845632076263428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,4,1,power_law_1.2,0.2813184022903442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,4,1,power_law_1.2,0.28458878993988035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,8,1,balanced,0.15945067008336386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,8,1,balanced,0.16105600198109946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,8,1,power_law_1.01,0.1584831953048706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,8,1,power_law_1.01,0.15877759456634521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,8,1,power_law_1.2,0.15694719552993774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,14336,2,8,8,1,power_law_1.2,0.1592576026916504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,1,balanced,0.9608213106791178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,1,balanced,0.9641866683959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,1,power_law_1.01,0.9998271942138672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,1,power_law_1.01,1.0337151527404784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,1,power_law_1.2,1.0476544380187989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,1,power_law_1.2,1.0531840324401855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,128,balanced,0.13359466195106506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,128,balanced,0.13385599851608276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,128,power_law_1.01,0.13322880268096923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,128,power_law_1.01,0.1335360050201416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,128,power_law_1.2,0.1362239956855774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,128,power_law_1.2,0.13841279745101928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,16,balanced,0.1693333387374878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,16,balanced,0.170741339524587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,16,power_law_1.01,0.1814784049987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,16,power_law_1.01,0.18442239761352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,16,power_law_1.2,0.19368319511413573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,16,power_law_1.2,0.19606399536132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,2,balanced,0.5598560174306234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,2,balanced,0.5609066486358643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,2,power_law_1.01,0.58373122215271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,2,power_law_1.01,0.5876736164093017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,2,power_law_1.2,0.5922560214996337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,2,power_law_1.2,0.6054463863372803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,32,balanced,0.14593600233395895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,32,balanced,0.1471733351548513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,32,power_law_1.01,0.15358079671859742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,32,power_law_1.01,0.1555008053779602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,32,power_law_1.2,0.15856000185012817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,32,power_law_1.2,0.15935360193252562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,4,balanced,0.3323040008544922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,4,balanced,0.3333226641019185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,4,power_law_1.01,0.3640064001083374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,4,power_law_1.01,0.3714688062667847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,4,power_law_1.2,0.37236480712890624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,4,power_law_1.2,0.37747199535369874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,64,balanced,0.13729066650072733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,64,balanced,0.13902399937311807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,64,power_law_1.01,0.13982720375061036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,64,power_law_1.01,0.14035199880599974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,64,power_law_1.2,0.14338560104370118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,64,power_law_1.2,0.14540159702301025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,8,balanced,0.2343626618385315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,8,balanced,0.23508799076080322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,8,power_law_1.01,0.24117119312286378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,8,power_law_1.01,0.24528000354766846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,8,power_law_1.2,0.24453120231628417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,1,8,power_law_1.2,0.25109119415283204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,16,1,balanced,0.17402666807174683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,16,1,balanced,0.1743626594543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,16,1,power_law_1.01,0.18297599554061889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,16,1,power_law_1.01,0.18423680067062378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,16,1,power_law_1.2,0.20289919376373292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,16,1,power_law_1.2,0.20290560722351075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,2,1,balanced,0.46829867362976074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,2,1,balanced,0.47358934084574383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,2,1,power_law_1.01,0.5053760051727295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,2,1,power_law_1.01,0.527891206741333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,2,1,power_law_1.2,0.5271039962768554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,2,1,power_law_1.2,0.5321919918060303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,32,1,balanced,0.15451733271280924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,32,1,balanced,0.1551253298918406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,32,1,power_law_1.01,0.15970560312271118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,32,1,power_law_1.01,0.16173440217971802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,32,1,power_law_1.2,0.16320639848709106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,32,1,power_law_1.2,0.1637503981590271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,4,1,balanced,0.31993067264556885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,4,1,balanced,0.3205173412958781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,4,1,power_law_1.01,0.33535358905792234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,4,1,power_law_1.01,0.3461888074874878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,4,1,power_law_1.2,0.3587455987930298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,4,1,power_law_1.2,0.35964159965515136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,8,1,balanced,0.22843199968338013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,8,1,balanced,0.23271467288335165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,8,1,power_law_1.01,0.2350912094116211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,8,1,power_law_1.01,0.23584001064300536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,8,1,power_law_1.2,0.23705599308013917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,1536,8,128,8,1,power_law_1.2,0.240012788772583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,1,balanced,6.395680109659831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,1,balanced,6.405391693115234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,1,power_law_1.01,6.459500885009765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,1,power_law_1.01,6.5352638244628904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,1,power_law_1.2,6.668851470947265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,1,power_law_1.2,7.062438201904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,128,balanced,0.46537065505981445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,128,balanced,0.46537601947784424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,128,power_law_1.01,0.4814720153808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,128,power_law_1.01,0.487775993347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,128,power_law_1.2,0.4900224208831787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,128,power_law_1.2,0.4976640224456787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,16,balanced,0.7900533676147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,16,balanced,0.792522668838501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,16,power_law_1.01,0.8079936027526855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,16,power_law_1.01,0.8108991622924805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,16,power_law_1.2,0.8415552139282226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,16,power_law_1.2,0.8434816360473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,2,balanced,3.32698663075765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,2,balanced,3.5998827616373696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,2,power_law_1.01,3.5000446319580076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,2,power_law_1.01,3.500102233886719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,2,power_law_1.2,3.4795265197753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,2,power_law_1.2,3.584128189086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,256,balanced,0.44759468237559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,256,balanced,0.44780266284942627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,256,power_law_1.01,0.45864319801330566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,256,power_law_1.01,0.46110081672668457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,256,power_law_1.2,0.4643968105316162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,256,power_law_1.2,0.47246079444885253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,32,balanced,0.6119466622670492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,32,balanced,0.6145333449045817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,32,power_law_1.01,0.6326848030090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,32,power_law_1.01,0.633568000793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,32,power_law_1.2,0.6343935966491699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,32,power_law_1.2,0.6500607967376709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,4,balanced,1.8866346677144368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,4,balanced,1.8989760080973308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,4,power_law_1.01,1.8978048324584962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,4,power_law_1.01,1.9252096176147462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,4,power_law_1.2,1.8919551849365235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,4,power_law_1.2,1.9801088333129884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,64,balanced,0.5227893193562826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,64,balanced,0.5245706637700399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,64,power_law_1.01,0.5372288227081299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,64,power_law_1.01,0.5427328109741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,64,power_law_1.2,0.5383808135986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,64,power_law_1.2,0.5475264072418213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,8,balanced,1.1640373071034749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,8,balanced,1.164346694946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,8,power_law_1.01,1.1753024101257323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,8,power_law_1.01,1.1835007667541504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,8,power_law_1.2,1.1950079917907714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,1,8,power_law_1.2,1.2267583847045898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,16,1,balanced,1.6479679743448894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,16,1,balanced,1.6482666333516438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,16,1,power_law_1.01,1.6659967422485351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,16,1,power_law_1.01,1.6755968093872071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,16,1,power_law_1.2,1.7251903533935546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,16,1,power_law_1.2,1.7434816360473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,2,1,balanced,2.8363733291625977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,2,1,balanced,2.8503039677937827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,2,1,power_law_1.01,2.916652870178223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,2,1,power_law_1.01,2.9592639923095705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,2,1,power_law_1.2,3.00064640045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,2,1,power_law_1.2,3.1251903533935548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,32,1,balanced,1.3991039594014485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,32,1,balanced,1.4016373952229817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,32,1,power_law_1.01,1.4433088302612305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,32,1,power_law_1.01,1.44717435836792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,32,1,power_law_1.2,1.5069696426391601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,32,1,power_law_1.2,1.510912036895752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,4,1,balanced,2.6231306393941245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,4,1,balanced,2.7162081400553384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,4,1,power_law_1.01,2.405548858642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,4,1,power_law_1.01,2.4243263244628905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,4,1,power_law_1.2,2.4267263412475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,4,1,power_law_1.2,2.4514047622680666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,8,1,balanced,1.0771466890970867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,8,1,balanced,1.0785600344340007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,8,1,power_law_1.01,1.0719167709350585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,8,1,power_law_1.01,1.0791104316711426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,8,1,power_law_1.2,1.1144384384155273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,4096,2688,22,512,8,1,power_law_1.2,1.1263615608215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,1,balanced,1.7463946342468262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,1,balanced,1.8131945927937825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,1,power_law_1.01,1.7948480606079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,1,power_law_1.01,1.8315135955810546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,1,power_law_1.2,1.7426944732666017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,1,power_law_1.2,1.7722623825073243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,2,balanced,0.862938642501831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,2,balanced,0.8671092987060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,2,power_law_1.01,1.0674304008483886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,2,power_law_1.01,1.0859328269958497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,2,power_law_1.2,1.0177215576171874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,2,power_law_1.2,1.0858816146850585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,4,balanced,0.5010613203048706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,4,balanced,0.5032533407211304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,4,power_law_1.01,0.8260416030883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,4,power_law_1.01,0.8332927703857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,4,power_law_1.2,0.6649407863616943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,4,power_law_1.2,0.8349823951721191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,8,balanced,0.3779146671295166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,8,balanced,0.3786666790644328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,8,power_law_1.01,0.5385216236114502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,8,power_law_1.01,0.5503488063812256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,8,power_law_1.2,0.5482880115509033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,1,8,power_law_1.2,0.5655744075775146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,16,1,balanced,0.13507733742396036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,16,1,balanced,0.13597866892814636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,16,1,power_law_1.01,0.1386240005493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,16,1,power_law_1.01,0.13896960020065308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,16,1,power_law_1.2,0.14062080383300782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,16,1,power_law_1.2,0.14094079732894899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,2,1,balanced,0.8012906710306803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,2,1,balanced,0.8139999707539877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,2,1,power_law_1.01,0.826956844329834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,2,1,power_law_1.01,0.8468607902526856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,2,1,power_law_1.2,0.8503104209899902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,2,1,power_law_1.2,0.8548671722412109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,32,1,balanced,0.11249599854151408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,32,1,balanced,0.11303466558456421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,32,1,power_law_1.01,0.11509759426116943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,32,1,power_law_1.01,0.11576319932937622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,32,1,power_law_1.2,0.1158784031867981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,32,1,power_law_1.2,0.11630079746246338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,4,1,balanced,0.4235200087229411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,4,1,balanced,0.43111467361450195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,4,1,power_law_1.01,0.42824320793151854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,4,1,power_law_1.01,0.4310463905334473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,4,1,power_law_1.2,0.4335360050201416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,4,1,power_law_1.2,0.43802242279052733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,8,1,balanced,0.2278346618016561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,8,1,balanced,0.23069334030151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,8,1,power_law_1.01,0.23349759578704835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,8,1,power_law_1.01,0.2338495969772339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,8,1,power_law_1.2,0.2312000036239624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,16384,2,8,8,1,power_law_1.2,0.24360320568084717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,1,balanced,3.496373176574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,1,balanced,3.861845334370931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,1,power_law_1.01,3.3927040100097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,1,power_law_1.01,3.428083038330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,1,power_law_1.2,3.5498367309570313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,1,power_law_1.2,3.6070014953613283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,128,balanced,0.23172799746195474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,128,balanced,0.23221866289774576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,128,power_law_1.01,0.23497600555419923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,128,power_law_1.01,0.23998720645904542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,128,power_law_1.2,0.24084479808807374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,128,power_law_1.2,0.24535679817199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,16,balanced,0.416378657023112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,16,balanced,0.4180533488591512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,16,power_law_1.01,0.4174655914306641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,16,power_law_1.01,0.4220223903656006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,16,power_law_1.2,0.4149695873260498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,16,power_law_1.2,0.42543997764587405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,2,balanced,1.8689014116923015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,2,balanced,1.9784639676411946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,2,power_law_1.01,1.7613439559936523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,2,power_law_1.01,1.7686527252197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,2,power_law_1.2,1.8181631088256835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,2,power_law_1.2,1.8521152496337892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,256,balanced,0.2215786576271057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,256,balanced,0.2226453423500061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,256,power_law_1.01,0.22622079849243165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,256,power_law_1.01,0.22689919471740722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,256,power_law_1.2,0.23009281158447265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,256,power_law_1.2,0.2330496072769165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,32,balanced,0.315226674079895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,32,balanced,0.315610667069753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,32,power_law_1.01,0.3180416107177734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,32,power_law_1.01,0.3251967906951904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,32,power_law_1.2,0.3265791893005371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,32,power_law_1.2,0.3297919988632202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,4,balanced,1.0400853157043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,4,balanced,1.0451947053273518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,4,power_law_1.01,0.9654463768005371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,4,power_law_1.01,0.9896063804626465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,4,power_law_1.2,1.0355263710021974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,4,power_law_1.2,1.035852813720703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,64,balanced,0.25304534037907916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,64,balanced,0.25437333186467487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,64,power_law_1.01,0.26528000831604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,64,power_law_1.01,0.2657023906707764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,64,power_law_1.2,0.26998400688171387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,64,power_law_1.2,0.2713279962539673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,8,balanced,0.6241653362909952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,8,balanced,0.6253866751988729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,8,power_law_1.01,0.5872191905975341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,8,power_law_1.01,0.6142591953277587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,8,power_law_1.2,0.6247488021850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,1,8,power_law_1.2,0.6500607967376709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,16,1,balanced,0.4249226649602254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,16,1,balanced,0.4249759912490845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,16,1,power_law_1.01,0.40889601707458495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,16,1,power_law_1.01,0.4115839958190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,16,1,power_law_1.2,0.4190207958221436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,16,1,power_law_1.2,0.4214655876159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,2,1,balanced,1.9001493453979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,2,1,balanced,1.9602986971537273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,2,1,power_law_1.01,1.7171648025512696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,2,1,power_law_1.01,1.7531200408935548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,2,1,power_law_1.2,1.8078784942626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,2,1,power_law_1.2,1.8337087631225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,32,1,balanced,0.32636799414952594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,32,1,balanced,0.3291520078976949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,32,1,power_law_1.01,0.31623039245605467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,32,1,power_law_1.01,0.3190783977508545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,32,1,power_law_1.2,0.32401280403137206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,32,1,power_law_1.2,0.3270848035812378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,4,1,balanced,1.0107946395874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,4,1,balanced,1.0132479667663574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,4,1,power_law_1.01,0.967801570892334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,4,1,power_law_1.01,0.9703488349914551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,4,1,power_law_1.2,0.9913087844848633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,4,1,power_law_1.2,1.0150591850280761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,8,1,balanced,0.6303199927012125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,8,1,balanced,0.6317386627197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,8,1,power_law_1.01,0.6088640213012695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,8,1,power_law_1.01,0.6113408088684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,8,1,power_law_1.2,0.617523193359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2048,8,256,8,1,power_law_1.2,0.625497579574585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,1,balanced,2.7825867335001626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,1,balanced,2.786773363749186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,1,power_law_1.01,2.955295944213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,1,power_law_1.01,3.1012928009033205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,1,power_law_1.2,3.1032896041870117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,1,power_law_1.2,3.1052032470703126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,16,balanced,0.3451626698176066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,16,balanced,0.3474133412043254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,16,power_law_1.01,0.36986238956451417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,16,power_law_1.01,0.3808831930160522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,16,power_law_1.2,0.3793855905532837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,16,power_law_1.2,0.40833277702331544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,2,balanced,1.4908053080240886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,2,balanced,1.5365440050760906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,2,power_law_1.01,1.54335355758667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,2,power_law_1.01,1.5506688117980958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,2,power_law_1.2,1.5767552375793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,2,power_law_1.2,1.6218816757202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,32,balanced,0.2587946653366089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,32,balanced,0.25910399357477826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,32,power_law_1.01,0.2858112096786499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,32,power_law_1.01,0.2863296031951904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,32,power_law_1.2,0.29582719802856444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,32,power_law_1.2,0.30439679622650145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,4,balanced,0.8353973229726156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,4,balanced,0.8356640338897705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,4,power_law_1.01,0.8725503921508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,4,power_law_1.01,0.8875712394714356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,4,power_law_1.2,0.8983488082885742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,4,power_law_1.2,0.9172991752624512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,8,balanced,0.5073173443476359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,8,balanced,0.5080533425013224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,8,power_law_1.01,0.5408448219299317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,8,power_law_1.01,0.5460288047790527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,8,power_law_1.2,0.5514495849609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,1,8,power_law_1.2,0.5631423950195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,16,1,balanced,0.34862399101257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,16,1,balanced,0.3498026529947917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,16,1,power_law_1.01,0.3523967981338501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,16,1,power_law_1.01,0.3547071933746338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,16,1,power_law_1.2,0.3591936111450195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,16,1,power_law_1.2,0.36154880523681643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,2,1,balanced,1.470746676127116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,2,1,balanced,1.548437277475993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,2,1,power_law_1.01,1.507040023803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,2,1,power_law_1.01,1.5154239654541015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,2,1,power_law_1.2,1.5325823783874513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,2,1,power_law_1.2,1.5671680450439454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,32,1,balanced,0.31242666641871136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,32,1,balanced,0.3142079909642537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,32,1,power_law_1.01,0.3199359893798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,32,1,power_law_1.01,0.32027521133422854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,32,1,power_law_1.2,0.32247679233551024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,32,1,power_law_1.2,0.32471039295196535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,4,1,balanced,0.8198293050130209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,4,1,balanced,0.8251199722290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,4,1,power_law_1.01,0.8196096420288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,4,1,power_law_1.01,0.8203904151916503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,4,1,power_law_1.2,0.8424768447875977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,4,1,power_law_1.2,0.857209587097168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,8,1,balanced,0.483354647954305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,8,1,balanced,0.4853813250859578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,8,1,power_law_1.01,0.4895808219909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,8,1,power_law_1.01,0.5015615940093994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,8,1,power_law_1.2,0.5112192153930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,6144,2560,8,160,8,1,power_law_1.2,0.5330304145812989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,1,balanced,4.088399887084961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,1,balanced,4.0929867426554365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,1,power_law_1.01,3.7689983367919924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,1,power_law_1.01,3.7895999908447267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,1,power_law_1.2,3.9530624389648437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,1,power_law_1.2,4.277376174926758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,128,balanced,0.26121066013971966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,128,balanced,0.2613439957300822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,128,power_law_1.01,0.2583744049072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,128,power_law_1.01,0.2621632099151611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,128,power_law_1.2,0.2654655933380127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,128,power_law_1.2,0.27035520076751707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,16,balanced,0.4724533160527547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,16,balanced,0.4734826485315959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,16,power_law_1.01,0.4644480228424072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,16,power_law_1.01,0.47545599937438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,16,power_law_1.2,0.485203218460083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,16,power_law_1.2,0.4943295955657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,2,balanced,2.2211999893188477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,2,balanced,2.2601706186930337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,2,power_law_1.01,1.9821311950683593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,2,power_law_1.01,2.115648078918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,2,power_law_1.2,2.1523775100708007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,2,power_law_1.2,2.1792768478393554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,256,balanced,0.2526613275210063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,256,balanced,0.2544479966163635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,256,power_law_1.01,0.2515775918960571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,256,power_law_1.01,0.25179519653320315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,256,power_law_1.2,0.2538687944412231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,256,power_law_1.2,0.2547584056854248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,32,balanced,0.34886399904886883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,32,balanced,0.3526506821314494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,32,power_law_1.01,0.3579967975616455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,32,power_law_1.01,0.3661056041717529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,32,power_law_1.2,0.3666176080703735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,32,power_law_1.2,0.3701312065124512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,4,balanced,1.2048106988271077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,4,balanced,1.2049226760864258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,4,power_law_1.01,1.103769588470459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,4,power_law_1.01,1.1802111625671388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,4,power_law_1.2,1.2008255958557128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,4,power_law_1.2,1.226956844329834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,64,balanced,0.2807413339614868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,64,balanced,0.2810399929682414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,64,power_law_1.01,0.28726398944854736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,64,power_law_1.01,0.2914367914199829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,64,power_law_1.2,0.3011647939682007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,64,power_law_1.2,0.30570240020751954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,8,balanced,0.7155199845631918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,8,balanced,0.716426690419515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,8,power_law_1.01,0.6971263885498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,8,power_law_1.01,0.6998400211334228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,8,power_law_1.2,0.7112959861755371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,1,8,power_law_1.2,0.7234240055084229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,16,1,balanced,0.4914453426996867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,16,1,balanced,0.4923786719640096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,16,1,power_law_1.01,0.47458558082580565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,16,1,power_law_1.01,0.4765376091003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,16,1,power_law_1.2,0.4882815837860107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,16,1,power_law_1.2,0.48908162117004395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,2,1,balanced,2.266197363535563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,2,1,balanced,2.3191839853922525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,2,1,power_law_1.01,2.016543960571289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,2,1,power_law_1.01,2.086924743652344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,2,1,power_law_1.2,2.1507007598876955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,2,1,power_law_1.2,2.193600082397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,32,1,balanced,0.3741866747538249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,32,1,balanced,0.37547731399536133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,32,1,power_law_1.01,0.36801919937133787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,32,1,power_law_1.01,0.3687040090560913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,32,1,power_law_1.2,0.37507200241088867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,32,1,power_law_1.2,0.3791680097579956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,4,1,balanced,1.1741920312245686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,4,1,balanced,1.203386704126994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,4,1,power_law_1.01,1.1183232307434081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,4,1,power_law_1.01,1.1283072471618651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,4,1,power_law_1.2,1.1584128379821776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,4,1,power_law_1.2,1.1773247718811035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,8,1,balanced,0.7328000068664551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,8,1,balanced,0.7347520192464193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,8,1,power_law_1.01,0.7036416053771972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,8,1,power_law_1.01,0.713324785232544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,8,1,power_law_1.2,0.7161600112915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,256,8,1,power_law_1.2,0.7244991779327392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,1,balanced,6.602336247762044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,1,balanced,6.664469401041667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,1,power_law_1.01,5.244672012329102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,1,power_law_1.01,5.393439865112304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,1,power_law_1.2,5.773177719116211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,1,power_law_1.2,5.805126571655274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,128,balanced,0.32517866293589276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,128,balanced,0.32571200529734295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,128,power_law_1.01,0.31729280948638916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,128,power_law_1.01,0.3224064111709595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,128,power_law_1.2,0.3325567960739136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,128,power_law_1.2,0.336409592628479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,16,balanced,0.6467039982477824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,16,balanced,0.6477760076522827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,16,power_law_1.01,0.5868480205535889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,16,power_law_1.01,0.609388780593872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,16,power_law_1.2,0.6252543926239014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,16,power_law_1.2,0.6269824028015136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,2,balanced,3.3720480600992837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,2,balanced,3.43829345703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,2,power_law_1.01,2.7188159942626955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,2,power_law_1.01,2.782547187805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,2,power_law_1.2,2.894272041320801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,2,power_law_1.2,2.944825553894043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,32,balanced,0.4737173318862915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,32,balanced,0.47438931465148926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,32,power_law_1.01,0.4539072036743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,32,power_law_1.01,0.4590144157409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,32,power_law_1.2,0.4646143913269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,32,power_law_1.2,0.4679872035980225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,4,balanced,1.7357279459635417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,4,balanced,1.7413333257039387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,4,power_law_1.01,1.5424127578735352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,4,power_law_1.01,1.5469440460205077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,4,power_law_1.2,1.5769536018371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,4,power_law_1.2,1.585439968109131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,64,balanced,0.37116265296936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,64,balanced,0.3712426821390788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,64,power_law_1.01,0.3597248077392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,64,power_law_1.01,0.3714303970336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,64,power_law_1.2,0.36885120868682864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,64,power_law_1.2,0.37518720626831054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,8,balanced,1.0198240280151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,8,balanced,1.0204479694366455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,8,power_law_1.01,0.9035264015197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,8,power_law_1.01,0.9659839630126953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,8,power_law_1.2,0.8827712059020996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,1,8,power_law_1.2,0.9228672027587891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,16,1,balanced,0.701317310333252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,16,1,balanced,0.7016426722208658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,16,1,power_law_1.01,0.6528831958770752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,16,1,power_law_1.01,0.6549056053161622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,16,1,power_law_1.2,0.6551296234130859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,16,1,power_law_1.2,0.6622015953063964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,2,1,balanced,3.3286720911661782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,2,1,balanced,3.3679466247558594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,2,1,power_law_1.01,2.7412351608276366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,2,1,power_law_1.01,2.7534528732299806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,2,1,power_law_1.2,2.8428415298461913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,2,1,power_law_1.2,2.8470272064208983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,32,1,balanced,0.5580426851908366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,32,1,balanced,0.5580693483352661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,32,1,power_law_1.01,0.5110911846160888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,32,1,power_law_1.01,0.5215936183929444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,32,1,power_law_1.2,0.5225791931152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,32,1,power_law_1.2,0.5291391849517822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,4,1,balanced,1.7769546508789062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,4,1,balanced,1.8406933148701985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,4,1,power_law_1.01,1.498681640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,4,1,power_law_1.01,1.5356608390808106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,4,1,power_law_1.2,1.5452223777770997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,4,1,power_law_1.2,1.5509440422058105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,8,1,balanced,1.0631732940673828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,8,1,balanced,1.0638133684794109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,8,1,power_law_1.01,0.9271360397338867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,8,1,power_law_1.01,0.9346495628356933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,8,1,power_law_1.2,0.9379584312438964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,768,7168,2048,8,384,8,1,power_law_1.2,0.9469887733459472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,1,balanced,0.12019733587900798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,1,balanced,0.1202880044778188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,1,power_law_1.01,0.09322239756584168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,1,power_law_1.01,0.09493119716644287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,1,power_law_1.2,0.0918720006942749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,1,power_law_1.2,0.09203839898109437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,128,balanced,0.028090665737787884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,128,balanced,0.029194665451844532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,128,power_law_1.01,0.026713600754737853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,128,power_law_1.01,0.028012800216674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,128,power_law_1.2,0.026655998826026917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,128,power_law_1.2,0.02810879945755005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,16,balanced,0.029631999631722767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,16,balanced,0.030293333033720653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,16,power_law_1.01,0.03222399950027466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,16,power_law_1.01,0.03361920118331909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,16,power_law_1.2,0.03136639893054962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,16,power_law_1.2,0.03218559920787811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,2,balanced,0.07797333101431529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,2,balanced,0.0841439962387085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,2,power_law_1.01,0.0720575988292694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,2,power_law_1.01,0.07484800219535828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,2,power_law_1.2,0.06581760048866273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,2,power_law_1.2,0.06651520133018493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,32,balanced,0.02940266579389572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,32,balanced,0.02941333254178365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,32,power_law_1.01,0.02803199887275696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,32,power_law_1.01,0.029318401217460634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,32,power_law_1.2,0.027596798539161683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,32,power_law_1.2,0.028281599283218384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,4,balanced,0.05282133320967356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,4,balanced,0.05346133311589559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,4,power_law_1.01,0.05180799961090088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,4,power_law_1.01,0.05985280275344849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,4,power_law_1.2,0.05141119956970215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,4,power_law_1.2,0.05655679702758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,64,balanced,0.02758399893840154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,64,balanced,0.02846933404604594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,64,power_law_1.01,0.027276799082756042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,64,power_law_1.01,0.027500799298286437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,64,power_law_1.2,0.02680320143699646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,64,power_law_1.2,0.027750399708747864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,8,balanced,0.03555200000603994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,8,balanced,0.035904000202814736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,8,power_law_1.01,0.047295999526977536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,8,power_law_1.01,0.047353601455688475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,8,power_law_1.2,0.04082559943199158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,1,8,power_law_1.2,0.04271360039710999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,2,1,balanced,0.07774933179219563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,2,1,balanced,0.07813333471616109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,2,1,power_law_1.01,0.06758400201797485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,2,1,power_law_1.01,0.06948480010032654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,2,1,power_law_1.2,0.06220160126686096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,2,1,power_law_1.2,0.06471679806709289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,4,1,balanced,0.056736002365748085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,4,1,balanced,0.05774400134881338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,4,1,power_law_1.01,0.04628480076789856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,4,1,power_law_1.01,0.04869759976863861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,4,1,power_law_1.2,0.04517120122909546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2048,768,8,128,4,1,power_law_1.2,0.04668799936771393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,1,balanced,0.24918399254480997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,1,balanced,0.2520479957262675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,1,power_law_1.01,0.20703999996185302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,1,power_law_1.01,0.2129728078842163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,1,power_law_1.2,0.1906496047973633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,1,power_law_1.2,0.19362560510635377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,128,balanced,0.03325333446264267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,128,balanced,0.03382933388153712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,128,power_law_1.01,0.03136639893054962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,128,power_law_1.01,0.031999999284744264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,128,power_law_1.2,0.03187839984893799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,16,balanced,0.04870399832725525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,16,balanced,0.04967466493447622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,16,power_law_1.01,0.06218240261077881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,16,power_law_1.01,0.06780800223350525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,16,power_law_1.2,0.06382079720497132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,16,power_law_1.2,0.0686847984790802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,2,balanced,0.14793599645296732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,2,balanced,0.15067199865976968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,2,power_law_1.01,0.1412608027458191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,2,power_law_1.01,0.1446720004081726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,2,power_law_1.2,0.12303359508514404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,2,power_law_1.2,0.13671679496765138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,32,balanced,0.041493333876132965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,32,balanced,0.041738669077555336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,32,power_law_1.01,0.04141440093517303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,32,power_law_1.01,0.04467200040817261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,32,power_law_1.2,0.04188799858093262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,32,power_law_1.2,0.04429439902305603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,4,balanced,0.09334933757781982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,4,balanced,0.09341333309809367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,4,power_law_1.01,0.1048192024230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,4,power_law_1.01,0.11119999885559081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,4,power_law_1.2,0.09669119715690613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,4,power_law_1.2,0.11200640201568604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,64,balanced,0.035589332381884255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,64,balanced,0.03563733398914337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,64,power_law_1.01,0.035206401348114015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,64,power_law_1.01,0.03640320003032684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,64,power_law_1.2,0.034092798829078674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,64,power_law_1.2,0.034176000952720643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,8,balanced,0.06083733340104421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,8,balanced,0.06089066465695699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,8,power_law_1.01,0.07987840175628662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,8,power_law_1.01,0.08795520067214965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,8,power_law_1.2,0.08232960104942322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,1,8,power_law_1.2,0.08650239706039428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,16,1,balanced,0.09462933739026387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,16,1,balanced,0.09501866499582927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,16,1,power_law_1.01,0.08663679957389832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,16,1,power_law_1.01,0.08723840117454529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,16,1,power_law_1.2,0.08055040240287781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,16,1,power_law_1.2,0.08103039860725403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,2,1,balanced,0.14416533708572388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,2,1,balanced,0.14467733105023703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,2,1,power_law_1.01,0.12459520101547242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,2,1,power_law_1.01,0.125164794921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,2,1,power_law_1.2,0.11855360269546508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,2,1,power_law_1.2,0.1211967945098877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,32,1,balanced,0.08678932984670003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,32,1,balanced,0.08679999907811482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,32,1,power_law_1.01,0.07953919768333435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,32,1,power_law_1.01,0.08266879916191101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,32,1,power_law_1.2,0.07369599938392639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,32,1,power_law_1.2,0.07525119781494141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,4,1,balanced,0.09215999643007915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,4,1,balanced,0.09262933333714803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,4,1,power_law_1.01,0.08544639945030212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,4,1,power_law_1.01,0.086080002784729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,4,1,power_law_1.2,0.08072320222854615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,4,1,power_law_1.2,0.08102399706840516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,8,1,balanced,0.11953066786130269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,8,1,balanced,0.11983467141787212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,8,1,power_law_1.01,0.10768640041351318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,8,1,power_law_1.01,0.10821759700775146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,8,1,power_law_1.2,0.09670400023460388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,2688,1856,6,128,8,1,power_law_1.2,0.09887359738349914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,1,balanced,0.28519999980926514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,1,balanced,0.2858240008354187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,1,power_law_1.01,0.2828416109085083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,1,power_law_1.01,0.28318080902099607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,1,power_law_1.2,0.27806079387664795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,1,power_law_1.2,0.28129920959472654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,128,balanced,0.033258666594823204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,128,balanced,0.033626665671666466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,128,power_law_1.01,0.03240959942340851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,128,power_law_1.01,0.03250559866428375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,128,power_law_1.2,0.03249920010566711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,128,power_law_1.2,0.03264000117778778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,16,balanced,0.04550399879614512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,16,balanced,0.04584533472855886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,16,power_law_1.01,0.09543039798736572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,16,power_law_1.01,0.09619839787483216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,16,power_law_1.2,0.0936896026134491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,16,power_law_1.2,0.09550719857215881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,2,balanced,0.16745599110921225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,2,balanced,0.16941867272059122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,2,power_law_1.01,0.19067519903182983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,2,power_law_1.01,0.20739200115203857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,2,power_law_1.2,0.17352319955825807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,2,power_law_1.2,0.17910399436950683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,256,balanced,0.03177600105603536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,256,balanced,0.033471999069054924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,256,power_law_1.01,0.0315200001001358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,256,power_law_1.01,0.03155199885368347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,256,power_law_1.2,0.03196159899234772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,256,power_law_1.2,0.032543998956680295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,32,balanced,0.033359999457995095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,32,balanced,0.03538133452335993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,32,power_law_1.01,0.06021760106086731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,32,power_law_1.01,0.06046079993247986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,32,power_law_1.2,0.05994240045547485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,32,power_law_1.2,0.060575997829437254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,4,balanced,0.1020853320757548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,4,balanced,0.10488532980283101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,4,power_law_1.01,0.1547968029975891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,4,power_law_1.01,0.157695996761322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,4,power_law_1.2,0.13559679985046386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,4,power_law_1.2,0.13968000411987305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,64,balanced,0.033439998825391136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,64,balanced,0.03400533397992452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,64,power_law_1.01,0.04476799964904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,64,power_law_1.01,0.046489599347114566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,64,power_law_1.2,0.044844800233840944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,64,power_law_1.2,0.045900800824165346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,8,balanced,0.06182933350404104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,8,balanced,0.06237333516279856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,8,power_law_1.01,0.12248320579528808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,8,power_law_1.01,0.12768640518188476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,8,power_law_1.2,0.11526399850845337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,1,8,power_law_1.2,0.12048640251159667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,16,1,balanced,0.051957334081331887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,16,1,balanced,0.05284800132115682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,16,1,power_law_1.01,0.051551997661590576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,16,1,power_law_1.01,0.051795202493667605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,16,1,power_law_1.2,0.05133439898490906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,16,1,power_law_1.2,0.051718401908874514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,2,1,balanced,0.16250666975975037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,2,1,balanced,0.1660533348719279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,2,1,power_law_1.01,0.1590783953666687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,2,1,power_law_1.01,0.1596735954284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,2,1,power_law_1.2,0.1523519992828369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,2,1,power_law_1.2,0.1534335970878601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,32,1,balanced,0.04596266647179922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,32,1,balanced,0.047295997540156044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,32,1,power_law_1.01,0.04676479995250702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,32,1,power_law_1.01,0.04696959853172302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,32,1,power_law_1.2,0.0460671991109848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,32,1,power_law_1.2,0.04657280147075653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,4,1,balanced,0.09844799836476643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,4,1,balanced,0.09912533561388652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,4,1,power_law_1.01,0.09507840275764465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,4,1,power_law_1.01,0.0958079993724823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,4,1,power_law_1.2,0.09347839951515198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,4,1,power_law_1.2,0.09382399916648865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,8,1,balanced,0.06821333368619283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,8,1,balanced,0.07037333150704701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,8,1,power_law_1.01,0.06753919720649719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,8,1,power_law_1.01,0.06815999746322632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,8,1,power_law_1.2,0.06575359702110291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,3072,1536,8,256,8,1,power_law_1.2,0.06636160016059875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,1,balanced,0.476581335067749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,1,balanced,0.478549321492513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,1,power_law_1.01,0.4235519886016846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,1,power_law_1.01,0.4676032066345215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,1,power_law_1.2,0.47379841804504397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,1,power_law_1.2,0.47675518989562987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,2,balanced,0.24741333723068237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,2,balanced,0.24778666098912558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,2,power_law_1.01,0.2363584041595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,2,power_law_1.01,0.23802239894866944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,2,power_law_1.2,0.2400576114654541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,2,power_law_1.2,0.2448575973510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,4,balanced,0.170799990495046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,4,balanced,0.17112533251444498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,4,power_law_1.01,0.15918079614639283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,4,power_law_1.01,0.1609984040260315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,4,power_law_1.2,0.159660804271698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,4,power_law_1.2,0.16059520244598388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,8,balanced,0.11132799585660298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,8,balanced,0.11545067032178243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,8,power_law_1.01,0.11040639877319336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,8,power_law_1.01,0.11052800416946411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,8,power_law_1.2,0.10929919481277466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,1,8,power_law_1.2,0.11063679456710815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,16,1,balanced,0.05595199763774872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,16,1,balanced,0.05634133517742157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,16,1,power_law_1.01,0.05182719826698303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,16,1,power_law_1.01,0.053235197067260744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,16,1,power_law_1.2,0.0506816029548645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,16,1,power_law_1.2,0.05267840027809143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,2,1,balanced,0.2529173294703166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,2,1,balanced,0.25519466400146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,2,1,power_law_1.01,0.2314687967300415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,2,1,power_law_1.01,0.2508928060531616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,2,1,power_law_1.2,0.25591681003570554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,2,1,power_law_1.2,0.2683327913284302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,32,1,balanced,0.03573333223660787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,32,1,balanced,0.039290666580200195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,32,1,power_law_1.01,0.03403519988059998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,32,1,power_law_1.01,0.03549439907073974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,32,1,power_law_1.2,0.03511039912700653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,32,1,power_law_1.2,0.03527039885520935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,4,1,balanced,0.146997332572937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,4,1,balanced,0.15787200133005777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,4,1,power_law_1.01,0.1223680019378662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,4,1,power_law_1.01,0.13482240438461304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,4,1,power_law_1.2,0.13498239517211913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,4,1,power_law_1.2,0.13608319759368898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,8,1,balanced,0.09550399581591289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,8,1,balanced,0.09828266501426697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,8,1,power_law_1.01,0.08107519745826722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,8,1,power_law_1.01,0.08293759822845459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,8,1,power_law_1.2,0.08293759822845459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,14336,2,8,8,1,power_law_1.2,0.08460800051689148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,1,balanced,0.38489067554473877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,1,balanced,0.3861226638158162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,1,power_law_1.01,0.29101440906524656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,1,power_law_1.01,0.2924544095993042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,1,power_law_1.2,0.2636607885360718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,1,power_law_1.2,0.26625919342041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,128,balanced,0.0352960005402565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,128,balanced,0.0374293327331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,128,power_law_1.01,0.0344895988702774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,128,power_law_1.01,0.034796801209449765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,128,power_law_1.2,0.03450239896774292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,128,power_law_1.2,0.03505919873714447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,16,balanced,0.05635733405749003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,16,balanced,0.057130664587020874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,16,power_law_1.01,0.06830719709396363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,16,power_law_1.01,0.07462400197982788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,16,power_law_1.2,0.06622080206871032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,16,power_law_1.2,0.06878719925880432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,2,balanced,0.21581333875656128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,2,balanced,0.21733866135279337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,2,power_law_1.01,0.19440000057220458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,2,power_law_1.01,0.19622399806976318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,2,power_law_1.2,0.16544640064239502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,2,power_law_1.2,0.16833280324935912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,32,balanced,0.03934400031963984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,32,balanced,0.0414986660083135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,32,power_law_1.01,0.04917759895324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,32,power_law_1.01,0.05046399831771851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,32,power_law_1.2,0.04709759950637817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,32,power_law_1.2,0.050297600030899045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,4,balanced,0.12525332967440286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,4,balanced,0.12942399581273398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,4,power_law_1.01,0.12778240442276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,4,power_law_1.01,0.15489920377731323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,4,power_law_1.2,0.1256832003593445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,4,power_law_1.2,0.14753279685974122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,64,balanced,0.035375999907652535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,64,balanced,0.03555200000603994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,64,power_law_1.01,0.036185601353645326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,64,power_law_1.01,0.038073599338531494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,64,power_law_1.2,0.03733119964599609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,64,power_law_1.2,0.03804160058498383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,8,balanced,0.07846400141716003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,8,balanced,0.08067200084527333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,8,power_law_1.01,0.09325439929962158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,8,power_law_1.01,0.11675519943237304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,8,power_law_1.2,0.09695360064506531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,1,8,power_law_1.2,0.10180480480194092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,16,1,balanced,0.07258666555086772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,16,1,balanced,0.07259733478228252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,16,1,power_law_1.01,0.05942400097846985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,16,1,power_law_1.01,0.061260801553726194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,16,1,power_law_1.2,0.05419520139694214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,16,1,power_law_1.2,0.05495679974555969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,2,1,balanced,0.2100586692492167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,2,1,balanced,0.21793599923451742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,2,1,power_law_1.01,0.16310399770736694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,2,1,power_law_1.01,0.16588159799575805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,2,1,power_law_1.2,0.1565888047218323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,2,1,power_law_1.2,0.1576192021369934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,32,1,balanced,0.0620959997177124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,32,1,balanced,0.06214933097362518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,32,1,power_law_1.01,0.05445759892463684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,32,1,power_law_1.01,0.05498239994049072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,32,1,power_law_1.2,0.051609599590301515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,32,1,power_law_1.2,0.05167359709739685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,4,1,balanced,0.12677866220474243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,4,1,balanced,0.12757333119710287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,4,1,power_law_1.01,0.10776959657669068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,4,1,power_law_1.01,0.1091007947921753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,4,1,power_law_1.2,0.10567679405212402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,4,1,power_law_1.2,0.10657919645309448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,8,1,balanced,0.0918933351834615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,8,1,balanced,0.09225599964459737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,8,1,power_law_1.01,0.07434880137443542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,8,1,power_law_1.01,0.07662720084190369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,8,1,power_law_1.2,0.0688256025314331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,1536,8,128,8,1,power_law_1.2,0.07160959839820862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,1,balanced,1.6675039927164714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,1,balanced,1.6720213890075684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,1,power_law_1.01,1.4981056213378907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,1,power_law_1.01,1.5100416183471679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,1,power_law_1.2,1.3380415916442872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,1,power_law_1.2,1.3675583839416503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,128,balanced,0.0701333334048589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,128,balanced,0.0703306645154953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,128,power_law_1.01,0.07415040135383606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,128,power_law_1.01,0.077920001745224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,128,power_law_1.2,0.07002879977226258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,128,power_law_1.2,0.07471359968185425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,16,balanced,0.2009119987487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,16,balanced,0.20323199033737183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,16,power_law_1.01,0.34328958988189695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,16,power_law_1.01,0.34552319049835206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,16,power_law_1.2,0.3445888042449951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,16,power_law_1.2,0.3457535982131958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,2,balanced,0.8847839832305908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,2,balanced,0.888474702835083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,2,power_law_1.01,0.9177087783813477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,2,power_law_1.01,0.9209024429321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,2,power_law_1.2,0.8337216377258301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,2,power_law_1.2,0.8541824340820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,256,balanced,0.06015466650327047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,256,balanced,0.06065600117047628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,256,power_law_1.01,0.056377601623535153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,256,power_law_1.01,0.05868160128593445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,256,power_law_1.2,0.0582144021987915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,256,power_law_1.2,0.05875840187072754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,32,balanced,0.15435733397801718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,32,balanced,0.15533333023389181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,32,power_law_1.01,0.2020672082901001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,32,power_law_1.01,0.20209920406341553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,32,power_law_1.2,0.20062079429626464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,32,power_law_1.2,0.20223360061645507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,4,balanced,0.4904959996541341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,4,balanced,0.495471994082133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,4,power_law_1.01,0.5903935909271241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,4,power_law_1.01,0.6631552219390869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,4,power_law_1.2,0.5986944198608398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,4,power_law_1.2,0.6395648002624512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,64,balanced,0.1109920044740041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,64,balanced,0.11202667156855266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,64,power_law_1.01,0.1219648003578186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,64,power_law_1.01,0.12264959812164307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,64,power_law_1.2,0.11872639656066894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,64,power_law_1.2,0.12319999933242798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,8,balanced,0.30024532477060956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,8,balanced,0.3019146720568339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,8,power_law_1.01,0.47096958160400393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,8,power_law_1.01,0.49297919273376467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,8,power_law_1.2,0.45394558906555177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,1,8,power_law_1.2,0.4737919807434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,16,1,balanced,0.5123039881388346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,16,1,balanced,0.513871987660726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,16,1,power_law_1.01,0.4499839782714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,16,1,power_law_1.01,0.4597760200500488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,16,1,power_law_1.2,0.40523519515991213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,16,1,power_law_1.2,0.40572161674499513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,2,1,balanced,0.8565920193990072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,2,1,balanced,0.8567306995391846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,2,1,power_law_1.01,0.7600255966186523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,2,1,power_law_1.01,0.7714303970336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,2,1,power_law_1.2,0.6983295917510987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,2,1,power_law_1.2,0.7142144203186035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,32,1,balanced,0.4284213383992513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,32,1,balanced,0.4289066791534424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,32,1,power_law_1.01,0.38435840606689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,32,1,power_law_1.01,0.3882816076278687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,32,1,power_law_1.2,0.331328010559082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,32,1,power_law_1.2,0.341593599319458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,4,1,balanced,0.504805326461792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,4,1,balanced,0.5066506862640381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,4,1,power_law_1.01,0.46120319366455076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,4,1,power_law_1.01,0.47135357856750487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,4,1,power_law_1.2,0.41214718818664553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,4,1,power_law_1.2,0.41587200164794924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,8,1,balanced,0.29920534292856854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,8,1,balanced,0.30001066128412884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,8,1,power_law_1.01,0.25883519649505615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,8,1,power_law_1.01,0.26447999477386475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,8,1,power_law_1.2,0.24530560970306398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,4096,2688,22,512,8,1,power_law_1.2,0.24712960720062255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,1,balanced,0.7155360380808512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,1,balanced,0.7457919915517172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,1,power_law_1.01,0.6929920196533204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,1,power_law_1.01,0.7179391860961915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,1,power_law_1.2,0.6976319789886475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,1,power_law_1.2,0.7002367973327637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,2,balanced,0.37748265266418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,2,balanced,0.40070398648579914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,2,power_law_1.01,0.34481918811798096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,2,power_law_1.01,0.3752703905105591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,2,power_law_1.2,0.3753664016723633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,2,power_law_1.2,0.37747199535369874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,4,balanced,0.22566932439804077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,4,balanced,0.23121599356333414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,4,power_law_1.01,0.22176640033721923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,4,power_law_1.01,0.22310400009155273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,4,power_law_1.2,0.22658560276031495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,4,power_law_1.2,0.24460160732269287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,8,balanced,0.15131200353304544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,8,balanced,0.15311466654141745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,8,power_law_1.01,0.15127040147781373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,8,power_law_1.01,0.15151360034942626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,8,power_law_1.2,0.1512768030166626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,1,8,power_law_1.2,0.1531391978263855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,16,1,balanced,0.07062399884064992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,16,1,balanced,0.07188266515731812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,16,1,power_law_1.01,0.06714239716529846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,16,1,power_law_1.01,0.06910719871520996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,16,1,power_law_1.2,0.0686079978942871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,16,1,power_law_1.2,0.06933119893074036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,2,1,balanced,0.37223466237386066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,2,1,balanced,0.4059520165125529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,2,1,power_law_1.01,0.3661952018737793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,2,1,power_law_1.01,0.3736576080322266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,2,1,power_law_1.2,0.3616767883300781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,2,1,power_law_1.2,0.36426239013671874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,32,1,balanced,0.05342400074005127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,32,1,balanced,0.05397333204746246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,32,1,power_law_1.01,0.049728000164031984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,32,1,power_law_1.01,0.050988799333572386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,32,1,power_law_1.2,0.05030400156974792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,32,1,power_law_1.2,0.05055360198020935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,4,1,balanced,0.21387734015782675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,4,1,balanced,0.23012266556421915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,4,1,power_law_1.01,0.20429439544677735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,4,1,power_law_1.01,0.21191680431365967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,4,1,power_law_1.2,0.210099196434021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,4,1,power_law_1.2,0.21217920780181884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,8,1,balanced,0.12811733285586038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,8,1,balanced,0.13946666320165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,8,1,power_law_1.01,0.1232192039489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,8,1,power_law_1.01,0.12376960515975952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,8,1,power_law_1.2,0.13144320249557495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,16384,2,8,8,1,power_law_1.2,0.13621120452880858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,1,balanced,0.7075680096944174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,1,balanced,0.7232853571573893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,1,power_law_1.01,0.7038784027099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,1,power_law_1.01,0.7047423839569091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,1,power_law_1.2,0.7044608116149902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,1,power_law_1.2,0.7072192192077636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,128,balanced,0.041984001795450844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,128,balanced,0.04349866509437561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,128,power_law_1.01,0.05915520191192627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,128,power_law_1.01,0.05947520136833191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,128,power_law_1.2,0.05159040093421936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,128,power_law_1.2,0.05930240154266357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,16,balanced,0.07974933087825775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,16,balanced,0.08104533453782399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,16,power_law_1.01,0.2158655881881714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,16,power_law_1.01,0.21748480796813965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,16,power_law_1.2,0.2162559986114502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,16,power_law_1.2,0.21713919639587403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,2,balanced,0.3747946818669637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,2,balanced,0.37730133533477783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,2,power_law_1.01,0.4364736080169678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,2,power_law_1.01,0.45240321159362795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,2,power_law_1.2,0.42371840476989747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,2,power_law_1.2,0.4559807777404785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,256,balanced,0.04417600234349569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,256,balanced,0.04533866544564565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,256,power_law_1.01,0.041503998637199405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,256,power_law_1.01,0.04271360039710999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,256,power_law_1.2,0.0414463996887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,256,power_law_1.2,0.04336639940738678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,32,balanced,0.06090133388837179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,32,balanced,0.06178133189678192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,32,power_law_1.01,0.1331071972846985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,32,power_law_1.01,0.135916805267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,32,power_law_1.2,0.13468159437179567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,32,power_law_1.2,0.13564159870147705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,4,balanced,0.21779733896255493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,4,balanced,0.21823465824127197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,4,power_law_1.01,0.351091194152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,4,power_law_1.01,0.35304319858551025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,4,power_law_1.2,0.2985471963882446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,4,power_law_1.2,0.33381760120391846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,64,balanced,0.04379733403523763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,64,balanced,0.0458186666170756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,64,power_law_1.01,0.07694720029830933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,64,power_law_1.01,0.07705600261688232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,64,power_law_1.2,0.07133439779281617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,64,power_law_1.2,0.072953599691391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,8,balanced,0.13793067137400308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,8,balanced,0.13869333267211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,8,power_law_1.01,0.2700671911239624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,8,power_law_1.01,0.30870399475097654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,8,power_law_1.2,0.2578752040863037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,1,8,power_law_1.2,0.2621248006820679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,16,1,balanced,0.09533333778381348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,16,1,balanced,0.09542933106422424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,16,1,power_law_1.01,0.09299200177192687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,16,1,power_law_1.01,0.09415040016174317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,16,1,power_law_1.2,0.09099519848823548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,16,1,power_law_1.2,0.09106559753417968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,2,1,balanced,0.37243199348449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,2,1,balanced,0.37477866808573407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,2,1,power_law_1.01,0.3733567953109741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,2,1,power_law_1.01,0.3737215995788574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,2,1,power_law_1.2,0.3620287895202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,2,1,power_law_1.2,0.36579198837280275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,32,1,balanced,0.0824480007092158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,32,1,balanced,0.08270399769147237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,32,1,power_law_1.01,0.08061439990997314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,32,1,power_law_1.01,0.0810368001461029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,32,1,power_law_1.2,0.08058239817619324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,32,1,power_law_1.2,0.08071039915084839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,4,1,balanced,0.2223893404006958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,4,1,balanced,0.22300799687703451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,4,1,power_law_1.01,0.21992959976196289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,4,1,power_law_1.01,0.22617599964141846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,4,1,power_law_1.2,0.21166720390319824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,4,1,power_law_1.2,0.2166208028793335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,8,1,balanced,0.14545599619547525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,8,1,balanced,0.14986133575439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,8,1,power_law_1.01,0.1472000002861023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,8,1,power_law_1.01,0.149510395526886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,8,1,power_law_1.2,0.14082560539245606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2048,8,256,8,1,power_law_1.2,0.14309120178222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,1,balanced,0.8731839656829834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,1,balanced,0.8763733704884847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,1,power_law_1.01,0.7341887950897217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,1,power_law_1.01,0.7566783905029297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,1,power_law_1.2,0.6642752170562745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,1,power_law_1.2,0.6648128032684326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,16,balanced,0.08673600355784099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,16,balanced,0.08693333466847737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,16,power_law_1.01,0.16915839910507202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,16,power_law_1.01,0.16951040029525757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,16,power_law_1.2,0.16543359756469728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,16,power_law_1.2,0.16832000017166138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,2,balanced,0.4572800000508626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,2,balanced,0.4582773447036743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,2,power_law_1.01,0.4197696208953857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,2,power_law_1.01,0.4528319835662842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,2,power_law_1.2,0.3971519947052002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,2,power_law_1.2,0.4487616062164307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,32,balanced,0.06348266700903575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,32,balanced,0.06524266799290974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,32,power_law_1.01,0.09326080083847046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,32,power_law_1.01,0.10017919540405273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,32,power_law_1.2,0.08695039749145508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,32,power_law_1.2,0.08696960210800171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,4,balanced,0.24858667453130087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,4,balanced,0.2507893244425456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,4,power_law_1.01,0.29322240352630613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,4,power_law_1.01,0.30208001136779783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,4,power_law_1.2,0.2770751953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,4,power_law_1.2,0.3495935916900635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,8,balanced,0.14801067113876343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,8,balanced,0.1481013298034668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,8,power_law_1.01,0.24318718910217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,8,power_law_1.01,0.24652159214019775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,8,power_law_1.2,0.21982719898223876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,1,8,power_law_1.2,0.23094398975372316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,16,1,balanced,0.12019733587900798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,16,1,balanced,0.1202826698621114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,16,1,power_law_1.01,0.10234240293502808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,16,1,power_law_1.01,0.10291839838027954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,16,1,power_law_1.2,0.0937279999256134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,16,1,power_law_1.2,0.09489920139312744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,2,1,balanced,0.45583999156951904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,2,1,balanced,0.4559146563212077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,2,1,power_law_1.01,0.38103039264678956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,2,1,power_law_1.01,0.3943615913391113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,2,1,power_law_1.2,0.3403968095779419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,2,1,power_law_1.2,0.3502336025238037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,32,1,balanced,0.09299199779828389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,32,1,balanced,0.09461333354314168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,32,1,power_law_1.01,0.08289920091629029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,32,1,power_law_1.01,0.0853056013584137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,32,1,power_law_1.2,0.07573760151863099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,32,1,power_law_1.2,0.07831040024757385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,4,1,balanced,0.25913600126902264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,4,1,balanced,0.273418664932251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,4,1,power_law_1.01,0.2239743947982788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,4,1,power_law_1.01,0.22736001014709473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,4,1,power_law_1.2,0.20594561100006104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,4,1,power_law_1.2,0.21558399200439454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,8,1,balanced,0.16777066389719644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,8,1,balanced,0.16876800855000815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,8,1,power_law_1.01,0.14923520088195802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,8,1,power_law_1.01,0.15345920324325563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,8,1,power_law_1.2,0.13367680311203003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,6144,2560,8,160,8,1,power_law_1.2,0.13390079736709595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,1,balanced,0.8197866280873617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,1,balanced,0.8212693532307943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,1,power_law_1.01,0.8187520027160644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,1,power_law_1.01,0.8194944381713867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,1,power_law_1.2,0.8184127807617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,1,power_law_1.2,0.8189824104309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,128,balanced,0.0496373325586319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,128,balanced,0.0499893327554067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,128,power_law_1.01,0.0631168007850647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,128,power_law_1.01,0.06376320123672485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,128,power_law_1.2,0.06106240153312683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,128,power_law_1.2,0.06416000127792358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,16,balanced,0.09059733152389526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,16,balanced,0.09233066439628601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,16,power_law_1.01,0.23157761096954346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,16,power_law_1.01,0.2493311882019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,16,power_law_1.2,0.24542078971862794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,16,power_law_1.2,0.24583039283752442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,2,balanced,0.43252265453338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,2,balanced,0.4339786767959595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,2,power_law_1.01,0.5303552150726318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,2,power_law_1.01,0.5342080116271972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,2,power_law_1.2,0.4872576236724854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,2,power_law_1.2,0.5150784015655517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,256,balanced,0.04971733192602793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,256,balanced,0.05162133276462555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,256,power_law_1.01,0.04892799854278564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,256,power_law_1.01,0.04997119903564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,256,power_law_1.2,0.04890879988670349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,256,power_law_1.2,0.05022720098495483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,32,balanced,0.06559999783833821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,32,balanced,0.06605866551399231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,32,power_law_1.01,0.15418239831924438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,32,power_law_1.01,0.1565440058708191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,32,power_law_1.2,0.15683200359344482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,32,power_law_1.2,0.15729279518127443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,4,balanced,0.2498133381207784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,4,balanced,0.25040000677108765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,4,power_law_1.01,0.373036789894104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,4,power_law_1.01,0.3881472110748291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,4,power_law_1.2,0.38594560623168944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,4,power_law_1.2,0.39029760360717775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,64,balanced,0.04995200037956238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,64,balanced,0.051589335004488625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,64,power_law_1.01,0.08525440096855164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,64,power_law_1.01,0.08906880021095276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,64,power_law_1.2,0.08325120210647582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,64,power_law_1.2,0.08529919981956482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,8,balanced,0.15642666816711426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,8,balanced,0.16568533579508463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,8,power_law_1.01,0.285427188873291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,8,power_law_1.01,0.30376319885253905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,8,power_law_1.2,0.2921152114868164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,1,8,power_law_1.2,0.31784958839416505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,16,1,balanced,0.10847999652226765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,16,1,balanced,0.10886399944623311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,16,1,power_law_1.01,0.10606080293655396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,16,1,power_law_1.01,0.10631680488586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,16,1,power_law_1.2,0.10396800041198731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,16,1,power_law_1.2,0.10410239696502685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,2,1,balanced,0.43144532044728595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,2,1,balanced,0.4488319953282674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,2,1,power_law_1.01,0.4277376174926758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,2,1,power_law_1.01,0.4327360153198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,2,1,power_law_1.2,0.41838722229003905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,2,1,power_law_1.2,0.42124161720275877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,32,1,balanced,0.09427199761072795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,32,1,balanced,0.09464533130327861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,32,1,power_law_1.01,0.0923520028591156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,32,1,power_law_1.01,0.09256960153579712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,32,1,power_law_1.2,0.0914687991142273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,32,1,power_law_1.2,0.09171839952468872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,4,1,balanced,0.2549813389778137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,4,1,balanced,0.28339733680089313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,4,1,power_law_1.01,0.2535936117172241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,4,1,power_law_1.01,0.2547327995300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,4,1,power_law_1.2,0.24766719341278076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,4,1,power_law_1.2,0.24854400157928466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,8,1,balanced,0.17303466796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,8,1,balanced,0.17337065935134888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,8,1,power_law_1.01,0.16736639738082887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,8,1,power_law_1.01,0.17472000122070314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,8,1,power_law_1.2,0.15829119682312012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,256,8,1,power_law_1.2,0.1638592004776001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,1,balanced,0.8209333419799805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,1,balanced,0.8245600064595541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,1,power_law_1.01,0.819660758972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,1,power_law_1.01,0.8203264236450195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,1,power_law_1.2,0.8201600074768066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,1,power_law_1.2,0.8217920303344727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,128,balanced,0.04961066444714864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,128,balanced,0.05022400120894114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,128,power_law_1.01,0.07121279835700989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,128,power_law_1.01,0.0713536024093628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,128,power_law_1.2,0.07137920260429383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,128,power_law_1.2,0.07171840071678162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,16,balanced,0.09085333347320557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,16,balanced,0.0918346643447876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,16,power_law_1.01,0.33118720054626466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,16,power_law_1.01,0.33956480026245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,16,power_law_1.2,0.32508800029754636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,16,power_law_1.2,0.337990403175354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,2,balanced,0.4349600076675415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,2,balanced,0.4495199918746948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,2,power_law_1.01,0.5723584175109864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,2,power_law_1.01,0.6116928100585938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,2,power_law_1.2,0.5873280048370362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,2,power_law_1.2,0.601478385925293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,32,balanced,0.06458666423956554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,32,balanced,0.06597866614659627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,32,power_law_1.01,0.18549760580062866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,32,power_law_1.01,0.18562560081481932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,32,power_law_1.2,0.18554879426956178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,32,power_law_1.2,0.1862912058830261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,4,balanced,0.2498826583226522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,4,balanced,0.2502453327178955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,4,power_law_1.01,0.4302720069885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,4,power_law_1.01,0.4411327838897705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,4,power_law_1.2,0.44471039772033694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,4,power_law_1.2,0.46894078254699706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,64,balanced,0.05132266879081726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,64,balanced,0.053818667928377785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,64,power_law_1.01,0.10763520002365112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,64,power_law_1.01,0.10851839780807496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,64,power_law_1.2,0.10785280466079712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,64,power_law_1.2,0.10812159776687622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,8,balanced,0.1525973379611969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,8,balanced,0.1597653329372406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,8,power_law_1.01,0.3643584012985229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,8,power_law_1.01,0.36725759506225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,8,power_law_1.2,0.333407998085022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,1,8,power_law_1.2,0.3621056079864502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,16,1,balanced,0.10693333546320598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,16,1,balanced,0.10878400007883708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,16,1,power_law_1.01,0.1066815972328186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,16,1,power_law_1.01,0.10701440572738648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,16,1,power_law_1.2,0.10625280141830444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,16,1,power_law_1.2,0.10639359951019287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,2,1,balanced,0.43010131518046063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,2,1,balanced,0.4328106641769409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,2,1,power_law_1.01,0.4300864219665527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,2,1,power_law_1.01,0.43029122352600097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,2,1,power_law_1.2,0.42828798294067383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,2,1,power_law_1.2,0.4287871837615967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,32,1,balanced,0.09289066990216573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,32,1,balanced,0.09479999542236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,32,1,power_law_1.01,0.0925055980682373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,32,1,power_law_1.01,0.09274880290031433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,32,1,power_law_1.2,0.09265279769897461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,32,1,power_law_1.2,0.0929472029209137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,4,1,balanced,0.25805334250132245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,4,1,balanced,0.2755039930343628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,4,1,power_law_1.01,0.25410559177398684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,4,1,power_law_1.01,0.2548223972320557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,4,1,power_law_1.2,0.2541311979293823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,4,1,power_law_1.2,0.25559680461883544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,8,1,balanced,0.16894400119781494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,8,1,balanced,0.17292799552281699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,8,1,power_law_1.01,0.1669376015663147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,8,1,power_law_1.01,0.17087359428405763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,8,1,power_law_1.2,0.16817920207977294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8,7168,2048,8,384,8,1,power_law_1.2,0.16970880031585694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,1,balanced,0.2091360092163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,1,balanced,0.2097813288370768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,1,power_law_1.01,0.19278080463409425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,1,power_law_1.01,0.19390079975128174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,1,power_law_1.2,0.1978495955467224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,1,power_law_1.2,0.20094079971313478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,128,balanced,0.03730133424202601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,128,balanced,0.03932266682386398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,128,power_law_1.01,0.036083200573921205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,128,power_law_1.01,0.03649280071258545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,128,power_law_1.2,0.035769599676132205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,128,power_law_1.2,0.03596799969673157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,16,balanced,0.048197334011395775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,16,balanced,0.048325334986050926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,16,power_law_1.01,0.043647998571395875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,16,power_law_1.01,0.04705280065536499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,16,power_law_1.2,0.040428799390792844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,16,power_law_1.2,0.04407039880752563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,2,balanced,0.1441439986228943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,2,balanced,0.1544266641139984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,2,power_law_1.01,0.1355712056159973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,2,power_law_1.01,0.13764480352401734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,2,power_law_1.2,0.14096640348434447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,2,power_law_1.2,0.1411967992782593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,32,balanced,0.037920000652472176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,32,balanced,0.039488000174363456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,32,power_law_1.01,0.03672960102558136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,32,power_law_1.01,0.03681919872760773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,32,power_law_1.2,0.03681919872760773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,32,power_law_1.2,0.03687680065631867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,4,balanced,0.0820853312810262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,4,balanced,0.08223466575145721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,4,power_law_1.01,0.076665598154068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,4,power_law_1.01,0.07714560031890869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,4,power_law_1.2,0.07763199806213379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,4,power_law_1.2,0.0790336012840271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,64,balanced,0.03748266647259394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,64,balanced,0.03751466671625773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,64,power_law_1.01,0.03607679903507233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,64,power_law_1.01,0.03653120100498199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,64,power_law_1.2,0.03633280098438263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,64,power_law_1.2,0.03686400055885315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,8,balanced,0.06214933097362518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,8,balanced,0.06323733429114024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,8,power_law_1.01,0.059539198875427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,8,power_law_1.01,0.060575997829437254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,8,power_law_1.2,0.060678398609161376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,1,8,power_law_1.2,0.06082559823989868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,2,1,balanced,0.14401599764823914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,2,1,balanced,0.1458399991194407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,2,1,power_law_1.01,0.1364159941673279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,2,1,power_law_1.01,0.13668479919433593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,2,1,power_law_1.2,0.1366719961166382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,2,1,power_law_1.2,0.13927680253982544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,4,1,balanced,0.08402132987976074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,4,1,balanced,0.08481599887212117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,4,1,power_law_1.01,0.07667199969291687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,4,1,power_law_1.01,0.07711359858512878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,4,1,power_law_1.2,0.07918720245361328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2048,768,8,128,4,1,power_law_1.2,0.07919999957084656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,1,balanced,0.5825440088907877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,1,balanced,0.5849920113881429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,1,power_law_1.01,0.5003520011901855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,1,power_law_1.01,0.5273920059204101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,1,power_law_1.2,0.5078527927398682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,1,power_law_1.2,0.5267583847045898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,128,balanced,0.04752000172932943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,128,balanced,0.047839999198913574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,128,power_law_1.01,0.04556800127029419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,128,power_law_1.01,0.04583039879798889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,128,power_law_1.2,0.04586879909038544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,128,power_law_1.2,0.046105599403381346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,16,balanced,0.08222933113574982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,16,balanced,0.08262933293978374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,16,power_law_1.01,0.07899519801139832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,16,power_law_1.01,0.07955200076103211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,16,power_law_1.2,0.07806079983711242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,16,power_law_1.2,0.07902079820632935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,2,balanced,0.36591466267903644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,2,balanced,0.3659733136494954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,2,power_law_1.01,0.305401611328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,2,power_law_1.01,0.308569598197937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,2,power_law_1.2,0.3018304109573364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,2,power_law_1.2,0.31495680809021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,32,balanced,0.0710506687561671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,32,balanced,0.07197866837183635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,32,power_law_1.01,0.06593279838562012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,32,power_law_1.01,0.06951680183410644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,32,power_law_1.2,0.07007359862327575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,32,power_law_1.2,0.07057920098304749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,4,balanced,0.2055520017941793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,4,balanced,0.20906666914621988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,4,power_law_1.01,0.18732800483703613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,4,power_law_1.01,0.19379199743270875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,4,power_law_1.2,0.19050240516662598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,4,power_law_1.2,0.19800959825515746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,64,balanced,0.047541335225105286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,64,balanced,0.047653332352638245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,64,power_law_1.01,0.04892799854278564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,64,power_law_1.01,0.05249919891357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,64,power_law_1.2,0.04645119905471802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,64,power_law_1.2,0.04855040013790131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,8,balanced,0.11345066626866658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,8,balanced,0.11373866597811381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,8,power_law_1.01,0.10362880229949951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,8,power_law_1.01,0.1084928035736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,8,power_law_1.2,0.10746879577636718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,1,8,power_law_1.2,0.10826239585876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,16,1,balanced,0.24421334266662598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,16,1,balanced,0.24423466126124063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,16,1,power_law_1.01,0.20814719200134277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,16,1,power_law_1.01,0.21264638900756835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,16,1,power_law_1.2,0.21338880062103271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,16,1,power_law_1.2,0.2196863889694214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,2,1,balanced,0.35418132940928143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,2,1,balanced,0.3582186698913574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,2,1,power_law_1.01,0.29809279441833497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,2,1,power_law_1.01,0.30643200874328613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,2,1,power_law_1.2,0.2977792024612427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,2,1,power_law_1.2,0.3062335968017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,32,1,balanced,0.1972586711247762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,32,1,balanced,0.197434663772583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,32,1,power_law_1.01,0.16210559606552125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,32,1,power_law_1.01,0.16678400039672853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,32,1,power_law_1.2,0.168230402469635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,32,1,power_law_1.2,0.17222399711608888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,4,1,balanced,0.19502399365107217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,4,1,balanced,0.19563732544581094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,4,1,power_law_1.01,0.17828480005264283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,4,1,power_law_1.01,0.17863039970397948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,4,1,power_law_1.2,0.178547203540802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,4,1,power_law_1.2,0.1804352045059204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,8,1,balanced,0.42236800988515216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,8,1,balanced,0.42315733432769775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,8,1,power_law_1.01,0.3510400056838989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,8,1,power_law_1.01,0.36497280597686765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,8,1,power_law_1.2,0.3482687950134277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,2688,1856,6,128,8,1,power_law_1.2,0.3631103992462158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,1,balanced,1.1795360247294109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,1,balanced,1.1971253554026287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,1,power_law_1.01,0.9118271827697754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,1,power_law_1.01,0.9190336227416992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,1,power_law_1.2,0.9102335929870605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,1,power_law_1.2,0.9114815711975097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,128,balanced,0.04796266555786133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,128,balanced,0.05375466744105021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,128,power_law_1.01,0.04737919867038727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,128,power_law_1.01,0.04783360064029694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,128,power_law_1.2,0.048076799511909483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,128,power_law_1.2,0.05141119956970215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,16,balanced,0.11268267035484314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,16,balanced,0.1136799951394399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,16,power_law_1.01,0.09957119822502136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,16,power_law_1.01,0.10402560234069824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,16,power_law_1.2,0.09961599707603455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,16,power_law_1.2,0.10126080513000488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,2,balanced,0.6217386722564697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,2,balanced,0.6264479955037435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,2,power_law_1.01,0.5061376094818115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,2,power_law_1.01,0.5097472190856933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,2,power_law_1.2,0.4906816005706787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,2,power_law_1.2,0.5177279949188233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,256,balanced,0.04794666667779287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,256,balanced,0.04795200129350027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,256,power_law_1.01,0.04622719883918762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,256,power_law_1.01,0.046623998880386354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,256,power_law_1.2,0.04640640020370483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,256,power_law_1.2,0.04734080135822296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,32,balanced,0.08257066706816356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,32,balanced,0.08260799944400787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,32,power_law_1.01,0.07930240035057068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,32,power_law_1.01,0.08030080199241638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,32,power_law_1.2,0.07794560194015503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,32,power_law_1.2,0.0794431984424591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,4,balanced,0.3283466696739197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,4,balanced,0.3322506745656331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,4,power_law_1.01,0.28624639511108396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,4,power_law_1.01,0.29617919921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,4,power_law_1.2,0.29069440364837645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,4,power_law_1.2,0.30611839294433596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,64,balanced,0.06855999926726024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,64,balanced,0.07004266480604808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,64,power_law_1.01,0.06695039868354798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,64,power_law_1.01,0.06880000233650208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,64,power_law_1.2,0.06704000234603882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,64,power_law_1.2,0.06711680293083191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,8,balanced,0.21110934019088745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,8,balanced,0.21411732832590738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,8,power_law_1.01,0.1716096043586731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,8,power_law_1.01,0.20470399856567384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,8,power_law_1.2,0.17756799459457398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,1,8,power_law_1.2,0.17920000553131105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,16,1,balanced,0.12830400466918945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,16,1,balanced,0.1299253304799398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,16,1,power_law_1.01,0.10614399909973145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,16,1,power_law_1.01,0.10641280412673951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,16,1,power_law_1.2,0.10605440139770508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,16,1,power_law_1.2,0.10609279870986939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,2,1,balanced,0.6157813469568888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,2,1,balanced,0.6164480050404867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,2,1,power_law_1.01,0.47712001800537107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,2,1,power_law_1.01,0.48441600799560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,2,1,power_law_1.2,0.4741951942443848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,2,1,power_law_1.2,0.47870721817016604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,32,1,balanced,0.09913067022959392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,32,1,balanced,0.10057600339253743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,32,1,power_law_1.01,0.08547840118408204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,32,1,power_law_1.01,0.08755840063095092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,32,1,power_law_1.2,0.08518400192260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,32,1,power_law_1.2,0.08663039803504943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,4,1,balanced,0.32607465982437134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,4,1,balanced,0.32708799839019775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,4,1,power_law_1.01,0.25932159423828127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,4,1,power_law_1.01,0.26576640605926516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,4,1,power_law_1.2,0.2549760103225708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,4,1,power_law_1.2,0.27644801139831543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,8,1,balanced,0.2112320065498352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,8,1,balanced,0.21187732617060342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,8,1,power_law_1.01,0.1639423966407776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,8,1,power_law_1.01,0.16571520566940307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,8,1,power_law_1.2,0.154476797580719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,3072,1536,8,256,8,1,power_law_1.2,0.16960639953613282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,1,balanced,0.5279733339945475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,1,balanced,0.5383413235346476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,1,power_law_1.01,0.5735616207122802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,1,power_law_1.01,0.58853759765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,1,power_law_1.2,0.5709248065948487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,1,power_law_1.2,0.5790080070495606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,2,balanced,0.3359626531600952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,2,balanced,0.3360053300857544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,2,power_law_1.01,0.37112960815429685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,2,power_law_1.01,0.3899327993392944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,2,power_law_1.2,0.37311999797821044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,2,power_law_1.2,0.3820607900619507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,4,balanced,0.23304533958435059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,4,balanced,0.2397759954134623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,4,power_law_1.01,0.26959359645843506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,4,power_law_1.01,0.2767359972000122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,4,power_law_1.2,0.26657919883728026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,4,power_law_1.2,0.2846848011016846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,8,balanced,0.20188266038894653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,8,balanced,0.20374933878580728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,8,power_law_1.01,0.21287040710449218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,8,power_law_1.01,0.22009599208831787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,8,power_law_1.2,0.21867520809173585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,1,8,power_law_1.2,0.24202880859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,16,1,balanced,0.0731573353211085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,16,1,balanced,0.07435733576615651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,16,1,power_law_1.01,0.07315840125083924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,16,1,power_law_1.01,0.0737600028514862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,16,1,power_law_1.2,0.07386239767074584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,16,1,power_law_1.2,0.07408639788627625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,2,1,balanced,0.27914132674535114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,2,1,balanced,0.28070932626724243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,2,1,power_law_1.01,0.2884416103363037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,2,1,power_law_1.01,0.298361611366272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,2,1,power_law_1.2,0.28215680122375486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,2,1,power_law_1.2,0.2875711917877197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,32,1,balanced,0.057962665955225624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,32,1,balanced,0.06019733349482218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,32,1,power_law_1.01,0.061638402938842776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,32,1,power_law_1.01,0.06178560256958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,32,1,power_law_1.2,0.06104320287704468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,32,1,power_law_1.2,0.06225919723510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,4,1,balanced,0.15075199802716574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,4,1,balanced,0.15239466230074564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,4,1,power_law_1.01,0.15841920375823976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,4,1,power_law_1.01,0.17069439888000487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,4,1,power_law_1.2,0.15381120443344115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,4,1,power_law_1.2,0.16255359649658202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,8,1,balanced,0.10373333096504211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,8,1,balanced,0.10714133580525716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,8,1,power_law_1.01,0.09808639883995056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,8,1,power_law_1.01,0.0985535979270935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,8,1,power_law_1.2,0.09990400075912476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,14336,2,8,8,1,power_law_1.2,0.10012799501419067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,1,balanced,0.8126239776611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,1,balanced,0.8176480134328207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,1,power_law_1.01,0.7325119972229004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,1,power_law_1.01,0.7495488166809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,1,power_law_1.2,0.767091178894043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,1,power_law_1.2,0.7676352024078369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,128,balanced,0.054042667150497437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,128,balanced,0.05509866774082184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,128,power_law_1.01,0.051500797271728516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,128,power_law_1.01,0.052211201190948485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,128,power_law_1.2,0.052172797918319705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,128,power_law_1.2,0.05242879986763001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,16,balanced,0.09804800152778625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,16,balanced,0.09834667046864827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,16,power_law_1.01,0.09379199743270875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,16,power_law_1.01,0.09463040232658386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,16,power_law_1.2,0.09377920031547546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,16,power_law_1.2,0.09550079703330994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,2,balanced,0.4306559960047404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,2,balanced,0.43144532044728595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,2,power_law_1.01,0.4101439952850342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,2,power_law_1.01,0.4120448112487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,2,power_law_1.2,0.41376638412475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,2,power_law_1.2,0.4160192012786865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,32,balanced,0.08210666477680206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,32,balanced,0.08272533118724823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,32,power_law_1.01,0.08022400140762329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,32,power_law_1.01,0.08079360127449035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,32,power_law_1.2,0.07944959998130799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,32,power_law_1.2,0.0796992003917694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,4,balanced,0.25516800085703534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,4,balanced,0.25540266434351605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,4,power_law_1.01,0.24593279361724854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,4,power_law_1.01,0.24938879013061524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,4,power_law_1.2,0.25016961097717283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,4,power_law_1.2,0.2535360097885132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,64,balanced,0.0622026671965917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,64,balanced,0.06674666702747345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,64,power_law_1.01,0.06342399716377259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,64,power_law_1.01,0.06622080206871032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,64,power_law_1.2,0.06180480122566223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,64,power_law_1.2,0.06625919938087463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,8,balanced,0.1376426617304484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,8,balanced,0.1386613349119822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,8,power_law_1.01,0.12911360263824462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,8,power_law_1.01,0.13462400436401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,8,power_law_1.2,0.1296064019203186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,1,8,power_law_1.2,0.13342080116271973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,16,1,balanced,0.10293333729108174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,16,1,balanced,0.10528533657391866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,16,1,power_law_1.01,0.09935359954833985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,16,1,power_law_1.01,0.0997759997844696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,16,1,power_law_1.2,0.1001855969429016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,16,1,power_law_1.2,0.10100480318069457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,2,1,balanced,0.3882186810175578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,2,1,balanced,0.3901439905166626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,2,1,power_law_1.01,0.3549952030181885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,2,1,power_law_1.01,0.3573440074920654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,2,1,power_law_1.2,0.36510720252990725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,2,1,power_law_1.2,0.36937599182128905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,32,1,balanced,0.08654399712880452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,32,1,balanced,0.0865760048230489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,32,1,power_law_1.01,0.08218240141868591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,32,1,power_law_1.01,0.08325759768486023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,32,1,power_law_1.2,0.08435840010643006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,32,1,power_law_1.2,0.08439040184020996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,4,1,balanced,0.2550453344980876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,4,1,balanced,0.25548799832661945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,4,1,power_law_1.01,0.24530560970306398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,4,1,power_law_1.01,0.2453376054763794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,4,1,power_law_1.2,0.24467840194702148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,4,1,power_law_1.2,0.24843521118164064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,8,1,balanced,0.1393226683139801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,8,1,balanced,0.1399786671002706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,8,1,power_law_1.01,0.13133440017700196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,8,1,power_law_1.01,0.1315135955810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,8,1,power_law_1.2,0.12996480464935303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,1536,8,128,8,1,power_law_1.2,0.13153280019760133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,1,balanced,5.379621505737305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,1,balanced,5.398933410644531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,1,power_law_1.01,4.553062438964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,1,power_law_1.01,4.578656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,1,power_law_1.2,4.537491226196289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,1,power_law_1.2,4.575795364379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,128,balanced,0.11741866668065389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,128,balanced,0.1179253359635671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,128,power_law_1.01,0.11475839614868164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,128,power_law_1.01,0.11546880006790161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,128,power_law_1.2,0.1143231987953186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,128,power_law_1.2,0.115065598487854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,16,balanced,0.41445334752400714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,16,balanced,0.4150079886118571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,16,power_law_1.01,0.3472512006759644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,16,power_law_1.01,0.3599168062210083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,16,power_law_1.2,0.35992319583892823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,16,power_law_1.2,0.40200319290161135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,2,balanced,2.726901372273763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,2,balanced,2.7735681533813477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,2,power_law_1.01,2.3408447265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,2,power_law_1.01,2.3586944580078124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,2,power_law_1.2,2.3000192642211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,2,power_law_1.2,2.3788223266601562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,256,balanced,0.1018346647421519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,256,balanced,0.10206400354703267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,256,power_law_1.01,0.10090880393981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,256,power_law_1.01,0.10131200551986694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,256,power_law_1.2,0.10127359628677368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,256,power_law_1.2,0.10173439979553223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,32,balanced,0.2485439976056417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,32,balanced,0.2625386714935303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,32,power_law_1.01,0.22572801113128663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,32,power_law_1.01,0.2307136058807373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,32,power_law_1.2,0.2036736011505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,32,power_law_1.2,0.23041279315948487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,4,balanced,1.402352015177409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,4,balanced,1.4077280362447102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,4,power_law_1.01,1.2032896041870118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,4,power_law_1.01,1.2884672164916993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,4,power_law_1.2,1.2326335906982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,4,power_law_1.2,1.2484992027282715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,64,balanced,0.1478559970855713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,64,balanced,0.14826666315396628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,64,power_law_1.01,0.13924479484558105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,64,power_law_1.01,0.14096640348434447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,64,power_law_1.2,0.13911039829254152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,64,power_law_1.2,0.1484544038772583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,8,balanced,0.7344426314036051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,8,balanced,0.736191987991333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,8,power_law_1.01,0.6592512130737305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,8,power_law_1.01,0.6757952213287354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,8,power_law_1.2,0.6658048152923584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,1,8,power_law_1.2,0.6720191955566406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,16,1,balanced,1.8132692972819011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,16,1,balanced,1.815893332163493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,16,1,power_law_1.01,1.5364224433898925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,16,1,power_law_1.01,1.567852783203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,16,1,power_law_1.2,1.541152000427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,16,1,power_law_1.2,1.5428223609924316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,2,1,balanced,2.4475199381510415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,2,1,balanced,2.4571839968363443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,2,1,power_law_1.01,2.0567935943603515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,2,1,power_law_1.01,2.0922048568725584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,2,1,power_law_1.2,2.0418304443359374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,2,1,power_law_1.2,2.0695423126220702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,32,1,balanced,1.2142079671223958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,32,1,balanced,1.2170506318410237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,32,1,power_law_1.01,1.032102394104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,32,1,power_law_1.01,1.0328000068664551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,32,1,power_law_1.2,1.0310527801513671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,32,1,power_law_1.2,1.051846408843994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,4,1,balanced,1.3949599266052246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,4,1,balanced,1.3984959920247395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,4,1,power_law_1.01,1.1896063804626464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,4,1,power_law_1.01,1.2032575607299805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,4,1,power_law_1.2,1.1906111717224122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,4,1,power_law_1.2,1.2030271530151366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,8,1,balanced,0.7545066674550375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,8,1,balanced,0.7546292940775553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,8,1,power_law_1.01,0.6496895790100098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,8,1,power_law_1.01,0.6549888134002686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,8,1,power_law_1.2,0.6414015769958497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,4096,2688,22,512,8,1,power_law_1.2,0.6554624080657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,1,balanced,0.859813372294108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,1,balanced,0.861957311630249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,1,power_law_1.01,0.9364416122436523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,1,power_law_1.01,0.9376192092895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,1,power_law_1.2,0.9479680061340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,1,power_law_1.2,0.9908864021301269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,2,balanced,0.48604798316955566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,2,balanced,0.5002079804738363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,2,power_law_1.01,0.5686848163604736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,2,power_law_1.01,0.5731008052825928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,2,power_law_1.2,0.5701056003570557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,2,power_law_1.2,0.5807936191558838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,4,balanced,0.3161226709683736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,4,balanced,0.31723199288050336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,4,power_law_1.01,0.37890560626983644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,4,power_law_1.01,0.3803776025772095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,4,power_law_1.2,0.3750272035598755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,4,power_law_1.2,0.41921281814575195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,8,balanced,0.25412799914677936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,8,balanced,0.2562613288561503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,8,power_law_1.01,0.2812096118927002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,8,power_law_1.01,0.28136320114135743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,8,power_law_1.2,0.2831360101699829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,1,8,power_law_1.2,0.3233664035797119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,16,1,balanced,0.10211199522018433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,16,1,balanced,0.10316266616185506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,16,1,power_law_1.01,0.10218240022659301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,16,1,power_law_1.01,0.10226559638977051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,16,1,power_law_1.2,0.10313600301742554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,16,1,power_law_1.2,0.10325759649276733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,2,1,balanced,0.4392000039418538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,2,1,balanced,0.45822401841481525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,2,1,power_law_1.01,0.47121281623840333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,2,1,power_law_1.01,0.4892096042633057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,2,1,power_law_1.2,0.4733439922332764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,2,1,power_law_1.2,0.4888768196105957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,32,1,balanced,0.0885653297106425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,32,1,balanced,0.08861333131790161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,32,1,power_law_1.01,0.08592000007629394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,32,1,power_law_1.01,0.08599039912223816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,32,1,power_law_1.2,0.08506240248680115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,32,1,power_law_1.2,0.08640639781951905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,4,1,balanced,0.2390879988670349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,4,1,balanced,0.24389866987864176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,4,1,power_law_1.01,0.2702143907546997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,4,1,power_law_1.01,0.28200318813323977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,4,1,power_law_1.2,0.2502912044525146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,4,1,power_law_1.2,0.2850752115249634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,8,1,balanced,0.1409119963645935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,8,1,balanced,0.15497066577275595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,8,1,power_law_1.01,0.14142080545425414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,8,1,power_law_1.01,0.14345599412918092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,8,1,power_law_1.2,0.14052480459213257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,16384,2,8,8,1,power_law_1.2,0.14149760007858275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,1,balanced,3.101989428202311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,1,balanced,3.1688000361124673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,1,power_law_1.01,2.4375871658325194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,1,power_law_1.01,2.449772834777832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,1,power_law_1.2,2.401158332824707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,1,power_law_1.2,2.433247947692871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,128,balanced,0.10250133275985718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,128,balanced,0.10316800077756245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,128,power_law_1.01,0.10042239427566528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,128,power_law_1.01,0.10080640316009522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,128,power_law_1.2,0.09993600249290466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,128,power_law_1.2,0.10012799501419067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,16,balanced,0.24646933873494467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,16,balanced,0.24924800793329874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,16,power_law_1.01,0.2123136043548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,16,power_law_1.01,0.2329279899597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,16,power_law_1.2,0.1962623953819275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,16,power_law_1.2,0.20709118843078614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,2,balanced,1.5770559310913086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,2,balanced,1.617194652557373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,2,power_law_1.01,1.2672575950622558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,2,power_law_1.01,1.2883968353271484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,2,power_law_1.2,1.2858112335205079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,2,power_law_1.2,1.3190655708312988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,256,balanced,0.08855467041333516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,256,balanced,0.09259200096130371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,256,power_law_1.01,0.08446720242500305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,256,power_law_1.01,0.09308159947395325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,256,power_law_1.2,0.08318719863891602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,256,power_law_1.2,0.09169279932975768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,32,balanced,0.14986667037010193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,32,balanced,0.1509866714477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,32,power_law_1.01,0.13285759687423707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,32,power_law_1.01,0.13553919792175292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,32,power_law_1.2,0.13645440340042114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,32,power_law_1.2,0.14379520416259767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,4,balanced,0.8254666328430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,4,balanced,0.826591968536377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,4,power_law_1.01,0.659225606918335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,4,power_law_1.01,0.7531263828277588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,4,power_law_1.2,0.6487743854522705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,4,power_law_1.2,0.658732795715332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,64,balanced,0.11619200309117635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,64,balanced,0.11672533551851909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,64,power_law_1.01,0.11348479986190796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,64,power_law_1.01,0.11509120464324951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,64,power_law_1.2,0.11193599700927734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,64,power_law_1.2,0.11338880062103271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,8,balanced,0.4301439921061198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,8,balanced,0.43032534917195636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,8,power_law_1.01,0.38505599498748777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,8,power_law_1.01,0.3923135995864868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,8,power_law_1.2,0.3987391948699951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,1,8,power_law_1.2,0.408787202835083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,16,1,balanced,0.2585013310114543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,16,1,balanced,0.2587253252665202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,16,1,power_law_1.01,0.2027008056640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,16,1,power_law_1.01,0.20853760242462158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,16,1,power_law_1.2,0.2055743932723999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,16,1,power_law_1.2,0.2056447982788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,2,1,balanced,1.5862773259480794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,2,1,balanced,1.6060694058736165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,2,1,power_law_1.01,1.2329728126525878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,2,1,power_law_1.01,1.2390656471252441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,2,1,power_law_1.2,1.2223360061645507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,2,1,power_law_1.2,1.2443455696105956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,32,1,balanced,0.18133866786956787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,32,1,balanced,0.1823093295097351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,32,1,power_law_1.01,0.15564160346984862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,32,1,power_law_1.01,0.15593600273132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,32,1,power_law_1.2,0.1546239972114563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,32,1,power_law_1.2,0.15776000022888184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,4,1,balanced,0.8054080009460449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,4,1,balanced,0.8076960245768229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,4,1,power_law_1.01,0.6260416030883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,4,1,power_law_1.01,0.6276864051818848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,4,1,power_law_1.2,0.6102719783782959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,4,1,power_law_1.2,0.6217599868774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,8,1,balanced,0.4310133457183838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,8,1,balanced,0.43340798219045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,8,1,power_law_1.01,0.37387518882751464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,8,1,power_law_1.01,0.3756799936294556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,8,1,power_law_1.2,0.3715327978134155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2048,8,256,8,1,power_law_1.2,0.37582719326019287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,1,balanced,2.455178737640381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,1,balanced,2.459167957305908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,1,power_law_1.01,2.1600255966186523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,1,power_law_1.01,2.205452728271484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,1,power_law_1.2,2.193203163146973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,1,power_law_1.2,2.2204992294311525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,16,balanced,0.19495999813079834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,16,balanced,0.19806400934855142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,16,power_law_1.01,0.19200639724731444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,16,power_law_1.01,0.1934592008590698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,16,power_law_1.2,0.18849920034408568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,16,power_law_1.2,0.19009920358657836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,2,balanced,1.2688000202178955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,2,balanced,1.2712426980336506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,2,power_law_1.01,1.1321215629577637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,2,power_law_1.01,1.1388671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,2,power_law_1.2,1.1157823562622071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,2,power_law_1.2,1.1836480140686034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,32,balanced,0.13768000404040018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,32,balanced,0.13793599605560303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,32,power_law_1.01,0.12996480464935303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,32,power_law_1.01,0.13052159547805786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,32,power_law_1.2,0.13534719944000245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,32,power_law_1.2,0.13570560216903688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,4,balanced,0.6619093418121338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,4,balanced,0.6620373328526815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,4,power_law_1.01,0.6029248237609863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,4,power_law_1.01,0.6032959938049316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,4,power_law_1.2,0.5974720001220704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,4,power_law_1.2,0.6114687919616699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,8,balanced,0.3777120113372803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,8,balanced,0.38062934080759686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,8,power_law_1.01,0.363590407371521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,8,power_law_1.01,0.36742401123046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,8,power_law_1.2,0.36112000942230227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,1,8,power_law_1.2,0.36712958812713625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,16,1,balanced,0.21113600333531699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,16,1,balanced,0.2113493283589681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,16,1,power_law_1.01,0.19214080572128295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,16,1,power_law_1.01,0.1941375970840454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,16,1,power_law_1.2,0.18863999843597412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,16,1,power_law_1.2,0.18994560241699218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,2,1,balanced,1.245695988337199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,2,1,balanced,1.2501973311106365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,2,1,power_law_1.01,1.0707200050354004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,2,1,power_law_1.01,1.073798370361328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,2,1,power_law_1.2,1.084006404876709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,2,1,power_law_1.2,1.1382783889770507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,32,1,balanced,0.16270400087038675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,32,1,balanced,0.16429866353670755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,32,1,power_law_1.01,0.14215680360794067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,32,1,power_law_1.01,0.14645760059356688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,32,1,power_law_1.2,0.14538880586624145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,32,1,power_law_1.2,0.1511296033859253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,4,1,balanced,0.631498654683431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,4,1,balanced,0.637445330619812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,4,1,power_law_1.01,0.5819007873535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,4,1,power_law_1.01,0.5856575965881348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,4,1,power_law_1.2,0.5808063983917237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,4,1,power_law_1.2,0.5876863956451416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,8,1,balanced,0.3783573309580485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,8,1,balanced,0.3796000083287557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,8,1,power_law_1.01,0.3392191886901855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,8,1,power_law_1.01,0.3538431882858276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,8,1,power_law_1.2,0.3518143892288208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,6144,2560,8,160,8,1,power_law_1.2,0.3555072069168091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,1,balanced,3.630319913228353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,1,balanced,3.6323038736979165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,1,power_law_1.01,2.866431999206543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,1,power_law_1.01,2.8804031372070313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,1,power_law_1.2,2.7718528747558593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,1,power_law_1.2,2.830758476257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,128,balanced,0.11395200093587239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,128,balanced,0.11555199821790059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,128,power_law_1.01,0.11249279975891113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,128,power_law_1.01,0.11285760402679443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,128,power_law_1.2,0.1124608039855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,128,power_law_1.2,0.11264640092849731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,16,balanced,0.27688533067703247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,16,balanced,0.2776266733805339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,16,power_law_1.01,0.23843200206756593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,16,power_law_1.01,0.2513535976409912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,16,power_law_1.2,0.250598406791687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,16,power_law_1.2,0.25640320777893066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,2,balanced,1.874527931213379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,2,balanced,1.8896427154541016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,2,power_law_1.01,1.4446592330932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,2,power_law_1.01,1.4943936347961426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,2,power_law_1.2,1.510867214202881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,2,power_law_1.2,1.57708797454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,256,balanced,0.10514133175214131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,256,balanced,0.10514666636784871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,256,power_law_1.01,0.10359040498733521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,256,power_law_1.01,0.104038405418396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,256,power_law_1.2,0.0942143976688385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,256,power_law_1.2,0.10477440357208252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,32,balanced,0.16845866044362387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,32,balanced,0.16875199476877847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,32,power_law_1.01,0.1587007999420166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,32,power_law_1.01,0.1600767970085144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,32,power_law_1.2,0.1514431953430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,32,power_law_1.2,0.15162880420684816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,4,balanced,0.9650453726450602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,4,balanced,0.9716373284657797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,4,power_law_1.01,0.8485631942749023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,4,power_law_1.01,0.8712896347045899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,4,power_law_1.2,0.7452735900878906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,4,power_law_1.2,0.7575744152069092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,64,balanced,0.12946666280428568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,64,balanced,0.13014933466911316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,64,power_law_1.01,0.12667520046234132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,64,power_law_1.01,0.12833919525146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,64,power_law_1.2,0.12680959701538086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,64,power_law_1.2,0.1274623990058899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,8,balanced,0.504693349202474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,8,balanced,0.5086986621220907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,8,power_law_1.01,0.445036792755127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,8,power_law_1.01,0.46857600212097167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,8,power_law_1.2,0.4384768009185791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,1,8,power_law_1.2,0.46155519485473634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,16,1,balanced,0.2990506688753764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,16,1,balanced,0.29945067564646405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,16,1,power_law_1.01,0.23680639266967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,16,1,power_law_1.01,0.23915519714355468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,16,1,power_law_1.2,0.234771203994751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,16,1,power_law_1.2,0.23840000629425048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,2,1,balanced,1.8606239954630535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,2,1,balanced,1.8783200581868489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,2,1,power_law_1.01,1.4442560195922851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,2,1,power_law_1.01,1.4488767623901366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,2,1,power_law_1.2,1.438758373260498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,2,1,power_law_1.2,1.4529791831970216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,32,1,balanced,0.20694933334986368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,32,1,balanced,0.20705600579579672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,32,1,power_law_1.01,0.17607680559158326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,32,1,power_law_1.01,0.17840640544891356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,32,1,power_law_1.2,0.17653759717941284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,32,1,power_law_1.2,0.1767807960510254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,4,1,balanced,0.9415573279062907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,4,1,balanced,0.9435733159383138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,4,1,power_law_1.01,0.7315264225006104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,4,1,power_law_1.01,0.7448639869689941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,4,1,power_law_1.2,0.7269696235656739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,4,1,power_law_1.2,0.7281536102294922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,8,1,balanced,0.5009013414382935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,8,1,balanced,0.5010079940160116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,8,1,power_law_1.01,0.4343679904937744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,8,1,power_law_1.01,0.4362175941467285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,8,1,power_law_1.2,0.43438081741333007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,256,8,1,power_law_1.2,0.4359424114227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,1,balanced,5.48252805074056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,1,balanced,5.526208241780599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,1,power_law_1.01,3.7482879638671873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,1,power_law_1.01,3.764326477050781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,1,power_law_1.2,3.6366527557373045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,1,power_law_1.2,3.6704769134521484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,128,balanced,0.1179200013478597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,128,balanced,0.1188106636206309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,128,power_law_1.01,0.11630719900131226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,128,power_law_1.01,0.11726080179214478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,128,power_law_1.2,0.11477119922637939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,128,power_law_1.2,0.11754239797592163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,16,balanced,0.44008533159891766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,16,balanced,0.4413919846216838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,16,power_law_1.01,0.35608959197998047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,16,power_law_1.01,0.4043712139129639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,16,power_law_1.2,0.35139200687408445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,16,power_law_1.2,0.3616960048675537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,2,balanced,2.7448161443074546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,2,balanced,2.7935358683268228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,2,power_law_1.01,1.8864511489868163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,2,power_law_1.01,2.015839958190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,2,power_law_1.2,1.954092788696289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,2,power_law_1.2,1.9952447891235352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,32,balanced,0.23227733373641968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,32,balanced,0.2346400022506714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,32,power_law_1.01,0.2232127904891968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,32,power_law_1.01,0.22357120513916015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,32,power_law_1.2,0.18885120153427123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,32,power_law_1.2,0.19571839570999144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,4,balanced,1.4073972702026367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,4,balanced,1.4098079999287922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,4,power_law_1.01,1.1260224342346192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,4,power_law_1.01,1.2148287773132325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,4,power_law_1.2,1.0682815551757812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,4,power_law_1.2,1.2591615676879884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,64,balanced,0.1441973348458608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,64,balanced,0.14520532886187235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,64,power_law_1.01,0.1410367965698242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,64,power_law_1.01,0.14227839708328247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,64,power_law_1.2,0.13649280071258546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,64,power_law_1.2,0.13667839765548706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,8,balanced,0.7283039887746176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,8,balanced,0.7288373311360677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,8,power_law_1.01,0.5967936038970947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,8,power_law_1.01,0.6371840000152588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,8,power_law_1.2,0.5757567882537842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,1,8,power_law_1.2,0.5807424068450928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,16,1,balanced,0.4731253385543823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,16,1,balanced,0.47650667031606037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,16,1,power_law_1.01,0.31319680213928225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,16,1,power_law_1.01,0.3170047998428345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,16,1,power_law_1.2,0.2946367979049683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,16,1,power_law_1.2,0.29780480861663816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,2,1,balanced,2.776362737019857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,2,1,balanced,2.7974398930867515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,2,1,power_law_1.01,1.9359743118286132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,2,1,power_law_1.01,1.9471807479858398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,2,1,power_law_1.2,1.8592256546020507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,2,1,power_law_1.2,1.8628032684326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,32,1,balanced,0.28110400835673016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,32,1,balanced,0.2820693254470825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,32,1,power_law_1.01,0.2117759943008423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,32,1,power_law_1.01,0.21276800632476806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,32,1,power_law_1.2,0.20823678970336915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,32,1,power_law_1.2,0.210534405708313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,4,1,balanced,1.3798240025838215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,4,1,balanced,1.3810240427652996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,4,1,power_law_1.01,0.9524864196777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,4,1,power_law_1.01,0.9710271835327149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,4,1,power_law_1.2,0.9367103576660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,4,1,power_law_1.2,0.9439231872558593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,8,1,balanced,0.7330933411916097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,8,1,balanced,0.7364266713460287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,8,1,power_law_1.01,0.5136000156402588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,8,1,power_law_1.01,0.5246848106384278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,8,1,power_law_1.2,0.5033279895782471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,80,7168,2048,8,384,8,1,power_law_1.2,0.5074944019317627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,1,balanced,0.8804852962493896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,1,balanced,0.8815680344899496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,1,power_law_1.01,1.0304832458496094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,1,power_law_1.01,1.0407039642333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,1,power_law_1.2,1.0486335754394531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,1,power_law_1.2,1.0518527984619142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,128,balanced,0.40801600615183514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,128,balanced,0.40833067893981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,128,power_law_1.01,0.443609619140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,128,power_law_1.01,0.44795517921447753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,128,power_law_1.2,0.4786367893218994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,128,power_law_1.2,0.4803840160369873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,16,balanced,0.4466346502304077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,16,balanced,0.44886934757232666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,16,power_law_1.01,0.4949120044708252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,16,power_law_1.01,0.5009856224060059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,16,power_law_1.2,0.5245952129364013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,16,power_law_1.2,0.5414015769958496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,2,balanced,0.7483839988708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,2,balanced,0.7521226406097412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,2,power_law_1.01,0.8404800415039062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,2,power_law_1.01,0.8415295600891113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,2,power_law_1.2,0.8534655570983887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,2,power_law_1.2,0.8992832183837891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,32,balanced,0.4230240186055501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,32,balanced,0.424293319384257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,32,power_law_1.01,0.46894078254699706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,32,power_law_1.01,0.4810495853424072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,32,power_law_1.2,0.5041024208068847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,32,power_law_1.2,0.5073215961456299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,4,balanced,0.5771520137786865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,4,balanced,0.579584002494812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,4,power_law_1.01,0.6282944202423095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,4,power_law_1.01,0.6451519966125489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,4,power_law_1.2,0.6591936111450195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,4,power_law_1.2,0.6932608127593994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,64,balanced,0.41212264696757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,64,balanced,0.41319998105367023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,64,power_law_1.01,0.45269122123718264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,64,power_law_1.01,0.46359682083129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,64,power_law_1.2,0.48209919929504397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,64,power_law_1.2,0.4990272045135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,8,balanced,0.4899146556854248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,8,balanced,0.49008532365163165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,8,power_law_1.01,0.5478655815124511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,8,power_law_1.01,0.552288007736206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,8,power_law_1.2,0.5818175792694091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,1,8,power_law_1.2,0.6096255779266357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,2,1,balanced,0.6614240010579427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,2,1,balanced,0.6639039913813273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,2,1,power_law_1.01,0.7158080101013183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,2,1,power_law_1.01,0.7164224147796631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,2,1,power_law_1.2,0.7214399814605713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,2,1,power_law_1.2,0.724345588684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,4,1,balanced,0.49480001131693524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,4,1,balanced,0.4963573217391968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,4,1,power_law_1.01,0.5268095970153809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,4,1,power_law_1.01,0.5299520015716552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,4,1,power_law_1.2,0.5354368209838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2048,768,8,128,4,1,power_law_1.2,0.5355711936950683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,1,balanced,1.9591946601867676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,1,balanced,1.961359977722168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,1,power_law_1.01,2.1709184646606445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,1,power_law_1.01,2.1828351974487306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,1,power_law_1.2,2.205471992492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,1,power_law_1.2,2.2447423934936523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,128,balanced,0.5342239936192831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,128,balanced,0.5352746645609537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,128,power_law_1.01,0.6036928176879883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,128,power_law_1.01,0.6056000232696533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,128,power_law_1.2,0.6577600002288818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,128,power_law_1.2,0.7135871887207031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,16,balanced,0.6195840040842692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,16,balanced,0.6202026605606079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,16,power_law_1.01,0.761356782913208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,16,power_law_1.01,0.7622335910797119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,16,power_law_1.2,0.7940159797668457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,16,power_law_1.2,0.8035903930664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,2,balanced,1.3110346794128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,2,balanced,1.322976032892863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,2,power_law_1.01,1.5358912467956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,2,power_law_1.01,1.54716796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,2,power_law_1.2,1.5946175575256347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,2,power_law_1.2,1.651430320739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,32,balanced,0.5702079931894938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,32,balanced,0.5714346567789713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,32,power_law_1.01,0.6737855911254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,32,power_law_1.01,0.7036416053771972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,32,power_law_1.2,0.7098752021789551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,32,power_law_1.2,0.7618048191070557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,4,balanced,0.9326240221659342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,4,balanced,0.932965358098348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,4,power_law_1.01,1.060870361328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,4,power_law_1.01,1.119155216217041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,4,power_law_1.2,1.1774975776672363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,4,power_law_1.2,1.2460927963256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,64,balanced,0.5433386564254761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,64,balanced,0.5439253250757853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,64,power_law_1.01,0.6353600025177002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,64,power_law_1.01,0.6409855842590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,64,power_law_1.2,0.7024511814117431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,64,power_law_1.2,0.7588096141815186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,8,balanced,0.7245279947916666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,8,balanced,0.7248266537984213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,8,power_law_1.01,0.8770879745483399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,8,power_law_1.01,0.8799551963806153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,8,power_law_1.2,0.9292415618896485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,1,8,power_law_1.2,0.971827220916748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,16,1,balanced,0.9090773264567057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,16,1,balanced,0.9110399881998698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,16,1,power_law_1.01,1.0367551803588868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,16,1,power_law_1.01,1.0383808135986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,16,1,power_law_1.2,1.0422783851623536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,16,1,power_law_1.2,1.046553611755371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,2,1,balanced,1.2334453264872234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,2,1,balanced,1.2364160219828289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,2,1,power_law_1.01,1.3494208335876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,2,1,power_law_1.01,1.3605055809020996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,2,1,power_law_1.2,1.3645376205444335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,2,1,power_law_1.2,1.37260160446167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,32,1,balanced,0.7471786340077718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,32,1,balanced,0.7480373382568359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,32,1,power_law_1.01,0.8553983688354492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,32,1,power_law_1.01,0.858675193786621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,32,1,power_law_1.2,0.8665920257568359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,32,1,power_law_1.2,0.8683072090148926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,4,1,balanced,0.7982772986094157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,4,1,balanced,0.7990826765696207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,4,1,power_law_1.01,0.8719936370849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,4,1,power_law_1.01,0.8858240127563477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,4,1,power_law_1.2,0.88919038772583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,4,1,power_law_1.2,0.8908224105834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,8,1,balanced,1.1491999626159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,8,1,balanced,1.150607983271281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,8,1,power_law_1.01,1.30250244140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,8,1,power_law_1.01,1.303884792327881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,8,1,power_law_1.2,1.309727954864502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,2688,1856,6,128,8,1,power_law_1.2,1.3200127601623535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,1,balanced,2.9535252253214517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,1,balanced,3.0776373545328775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,1,power_law_1.01,3.2977344512939455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,1,power_law_1.01,3.472742462158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,1,power_law_1.2,3.5045761108398437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,1,power_law_1.2,3.525356674194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,128,balanced,0.6383893489837646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,128,balanced,0.6406613190968832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,128,power_law_1.01,0.7082880020141602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,128,power_law_1.01,0.7210752010345459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,128,power_law_1.2,0.7516223907470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,128,power_law_1.2,0.7737023830413818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,16,balanced,0.7609972953796387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,16,balanced,0.7623573144276937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,16,power_law_1.01,0.8953023910522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,16,power_law_1.01,0.9100480079650879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,16,power_law_1.2,0.9384767532348632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,16,power_law_1.2,0.9725312232971192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,2,balanced,1.7354826927185059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,2,balanced,1.7616747220357258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,2,power_law_1.01,2.014124870300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,2,power_law_1.01,2.061625671386719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,2,power_law_1.2,2.0867904663085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,2,power_law_1.2,2.105587196350098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,256,balanced,0.6335519949595133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,256,balanced,0.6336106856664022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,256,power_law_1.01,0.6842495918273925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,256,power_law_1.01,0.6848832130432129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,256,power_law_1.2,0.7539199829101563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,256,power_law_1.2,0.7662911891937256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,32,balanced,0.6928426424662272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,32,balanced,0.6954826513926188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,32,power_law_1.01,0.7962944030761718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,32,power_law_1.01,0.7973120212554932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,32,power_law_1.2,0.8549247741699219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,32,power_law_1.2,0.8795007705688477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,4,balanced,1.1772747039794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,4,balanced,1.1824373404184978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,4,power_law_1.01,1.4036479949951173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,4,power_law_1.01,1.4081855773925782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,4,power_law_1.2,1.4763968467712403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,4,power_law_1.2,1.5352704048156738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,64,balanced,0.6542719999949137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,64,balanced,0.6555413405100504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,64,power_law_1.01,0.7347583770751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,64,power_law_1.01,0.7564223766326904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,64,power_law_1.2,0.7990208148956299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,64,power_law_1.2,0.8126463890075684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,8,balanced,0.9043359756469727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,8,balanced,0.9084213574727377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,8,power_law_1.01,1.0645248413085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,8,power_law_1.01,1.0892928123474122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,8,power_law_1.2,1.1140992164611816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,1,8,power_law_1.2,1.1749247550964355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,16,1,balanced,0.6232213179270426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,16,1,balanced,0.6252640088399252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,16,1,power_law_1.01,0.6951871871948242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,16,1,power_law_1.01,0.6973120212554932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,16,1,power_law_1.2,0.7073215961456298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,16,1,power_law_1.2,0.7081791877746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,2,1,balanced,1.603834629058838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,2,1,balanced,1.6644694010416667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,2,1,power_law_1.01,1.854355239868164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,2,1,power_law_1.01,1.8563455581665038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,2,1,power_law_1.2,1.8905855178833009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,2,1,power_law_1.2,1.8964031219482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,32,1,balanced,0.5287733475367228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,32,1,balanced,0.5292426745096842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,32,1,power_law_1.01,0.5963391780853271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,32,1,power_law_1.01,0.6007040023803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,32,1,power_law_1.2,0.6007232189178466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,32,1,power_law_1.2,0.6038400173187256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,4,1,balanced,1.0112586816151936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,4,1,balanced,1.0124746958414714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,4,1,power_law_1.01,1.1514752388000489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,4,1,power_law_1.01,1.153273582458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,4,1,power_law_1.2,1.1756159782409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,4,1,power_law_1.2,1.1817407608032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,8,1,balanced,0.7386026382446289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,8,1,balanced,0.7405386765797933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,8,1,power_law_1.01,0.8234496116638184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,8,1,power_law_1.01,0.8262399673461914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,8,1,power_law_1.2,0.8434752464294434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,3072,1536,8,256,8,1,power_law_1.2,0.8450048446655274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,1,balanced,6.8662668863932295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,1,balanced,7.095114390055339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,1,power_law_1.01,6.898649597167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,1,power_law_1.01,7.156819152832031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,1,power_law_1.2,7.196473693847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,1,power_law_1.2,7.203545379638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,2,balanced,3.691957473754883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,2,balanced,3.7434666951497397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,2,power_law_1.01,5.030112075805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,2,power_law_1.01,5.325612640380859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,2,power_law_1.2,4.677056121826172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,2,power_law_1.2,5.076736068725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,4,balanced,2.2181973457336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,4,balanced,2.254629294077555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,4,power_law_1.01,3.7038528442382814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,4,power_law_1.01,4.656921768188477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,4,power_law_1.2,3.965875244140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,4,power_law_1.2,3.9874496459960938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,8,balanced,1.5357012748718262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,8,balanced,1.5429654121398926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,8,power_law_1.01,3.348704147338867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,8,power_law_1.01,3.6444225311279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,8,power_law_1.2,3.5112384796142577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,1,8,power_law_1.2,3.7114303588867186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,16,1,balanced,0.5238826672236124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,16,1,balanced,0.528986652692159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,16,1,power_law_1.01,0.536684799194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,16,1,power_law_1.01,0.5422272205352783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,16,1,power_law_1.2,0.540019178390503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,16,1,power_law_1.2,0.5407999992370606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,2,1,balanced,3.201226552327474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,2,1,balanced,3.243562698364258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,2,1,power_law_1.01,3.2218559265136717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,2,1,power_law_1.01,3.246956634521484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,2,1,power_law_1.2,3.2287742614746096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,2,1,power_law_1.2,3.253433609008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,32,1,balanced,0.36295465628306073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,32,1,balanced,0.3632693290710449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,32,1,power_law_1.01,0.3690239906311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,32,1,power_law_1.01,0.37098240852355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,32,1,power_law_1.2,0.3703232049942017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,32,1,power_law_1.2,0.3712703943252563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,4,1,balanced,1.5633813540140789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,4,1,balanced,1.5737226804097493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,4,1,power_law_1.01,1.6774656295776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,4,1,power_law_1.01,1.6859775543212892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,4,1,power_law_1.2,1.684422492980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,4,1,power_law_1.2,1.6858560562133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,8,1,balanced,0.8651573657989502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,8,1,balanced,0.8790079752604166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,8,1,power_law_1.01,0.8958656311035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,8,1,power_law_1.01,0.9070976257324219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,8,1,power_law_1.2,0.9091456413269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,14336,2,8,8,1,power_law_1.2,0.9149760246276856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,1,balanced,3.392160097757975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,1,balanced,3.3952000935872397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,1,power_law_1.01,3.609939193725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,1,power_law_1.01,3.693766403198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,1,power_law_1.2,3.5791744232177733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,1,power_law_1.2,3.5883712768554688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,128,balanced,0.7083520094553629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,128,balanced,0.7088267008463541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,128,power_law_1.01,0.8497088432312012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,128,power_law_1.01,0.8546688079833984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,128,power_law_1.2,0.9606207847595215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,128,power_law_1.2,0.9646464347839355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,16,balanced,0.8476479848225912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,16,balanced,0.8505120277404785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,16,power_law_1.01,1.0716544151306153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,16,power_law_1.01,1.0848896026611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,16,power_law_1.2,1.1526975631713867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,16,power_law_1.2,1.2635775566101075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,2,balanced,2.07259194056193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,2,balanced,2.0801013310750327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,2,power_law_1.01,2.25229434967041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,2,power_law_1.01,2.3201919555664063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,2,power_law_1.2,2.3824640274047852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,2,power_law_1.2,2.5097280502319337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,32,balanced,0.7690613269805908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,32,balanced,0.7704693476359049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,32,power_law_1.01,0.9580287933349609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,32,power_law_1.01,0.9614272117614746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,32,power_law_1.2,1.0429696083068847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,32,power_law_1.2,1.0630335807800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,4,balanced,1.3374932607014973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,4,balanced,1.3428373336791992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,4,power_law_1.01,1.6097471237182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,4,power_law_1.01,1.6298431396484374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,4,power_law_1.2,1.6307968139648437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,4,power_law_1.2,1.6531391143798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,64,balanced,0.7301066716512045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,64,balanced,0.730400005976359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,64,power_law_1.01,0.8474368095397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,64,power_law_1.01,0.8887295722961426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,64,power_law_1.2,0.9684160232543946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,64,power_law_1.2,1.016160011291504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,8,balanced,1.0131306648254395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,8,balanced,1.0137386322021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,8,power_law_1.01,1.2306879997253417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,8,power_law_1.01,1.237337589263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,8,power_law_1.2,1.2961088180541993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,1,8,power_law_1.2,1.357260799407959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,16,1,balanced,0.7546292940775553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,16,1,balanced,0.7557226816813151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,16,1,power_law_1.01,0.8213055610656739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,16,1,power_law_1.01,0.8227264404296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,16,1,power_law_1.2,0.8285951614379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,16,1,power_law_1.2,0.8290495872497559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,2,1,balanced,1.5478240648905437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,2,1,balanced,1.552303949991862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,2,1,power_law_1.01,1.862348747253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,2,1,power_law_1.01,1.9282623291015626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,2,1,power_law_1.2,1.8643775939941407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,2,1,power_law_1.2,1.8698432922363282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,32,1,balanced,0.6404000123341879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,32,1,balanced,0.6409173409144083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,32,1,power_law_1.01,0.7036479949951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,32,1,power_law_1.01,0.7058752059936524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,32,1,power_law_1.2,0.7094528198242187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,32,1,power_law_1.2,0.7118207931518554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,4,1,balanced,1.1963413556416829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,4,1,balanced,1.1964213053385417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,4,1,power_law_1.01,1.2955583572387694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,4,1,power_law_1.01,1.3006591796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,4,1,power_law_1.2,1.315552043914795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,4,1,power_law_1.2,1.3171839714050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,8,1,balanced,0.8822027047475179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,8,1,balanced,0.8832586606343588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,8,1,power_law_1.01,0.9552767753601075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,8,1,power_law_1.01,0.955782413482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,8,1,power_law_1.2,0.9568832397460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,1536,8,128,8,1,power_law_1.2,0.961580753326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,1,balanced,19.302021026611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,1,balanced,19.46136474609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,1,power_law_1.01,19.77650604248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,1,power_law_1.01,20.220530700683593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,1,power_law_1.2,20.225535583496093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,1,power_law_1.2,20.515565490722658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,128,balanced,2.5563467343648276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,128,balanced,2.5570240020751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,128,power_law_1.01,2.820582389831543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,128,power_law_1.01,2.845683288574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,128,power_law_1.2,3.115488052368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,128,power_law_1.2,3.1443904876708983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,16,balanced,3.366938591003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,16,balanced,3.3749332427978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,16,power_law_1.01,3.8787456512451173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,16,power_law_1.01,3.8926017761230467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,16,power_law_1.2,4.000620651245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,16,power_law_1.2,4.173222351074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,2,balanced,10.81369654337565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,2,balanced,10.865008036295572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,2,power_law_1.01,11.543199920654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,2,power_law_1.01,11.745452880859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,2,power_law_1.2,12.037094116210938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,2,power_law_1.2,12.555283355712891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,256,balanced,2.494474728902181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,256,balanced,2.500666618347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,256,power_law_1.01,2.734694480895996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,256,power_law_1.01,2.7579647064208985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,256,power_law_1.2,2.910495948791504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,256,power_law_1.2,2.956038475036621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,32,balanced,2.9006827672322593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,32,balanced,2.9046506881713867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,32,power_law_1.01,3.2587390899658204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,32,power_law_1.01,3.3974079132080077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,32,power_law_1.2,3.4203201293945313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,32,power_law_1.2,3.651667022705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,4,balanced,6.2923628489176435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,4,balanced,6.544938405354817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,4,power_law_1.01,7.290509033203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,4,power_law_1.01,7.3053123474121096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,4,power_law_1.2,7.073683166503907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,4,power_law_1.2,7.388877105712891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,64,balanced,2.670074780782064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,64,balanced,2.6725438435872397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,64,power_law_1.01,2.981088066101074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,64,power_law_1.01,3.044646453857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,64,power_law_1.2,3.235686492919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,64,power_law_1.2,3.370220947265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,8,balanced,4.303866704305013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,8,balanced,4.321541468302409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,8,power_law_1.01,4.8830207824707035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,8,power_law_1.01,4.931520080566406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,8,power_law_1.2,5.323788833618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,1,8,power_law_1.2,5.425344085693359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,16,1,balanced,5.321706771850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,16,1,balanced,5.324367841084798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,16,1,power_law_1.01,5.812467193603515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,16,1,power_law_1.01,5.821247863769531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,16,1,power_law_1.2,5.906022262573242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,16,1,power_law_1.2,5.912876892089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,2,1,balanced,8.364240010579428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,2,1,balanced,8.820426940917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,2,1,power_law_1.01,9.584352111816406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,2,1,power_law_1.01,9.594048309326173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,2,1,power_law_1.2,9.577677154541016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,2,1,power_law_1.2,9.870066833496093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,32,1,balanced,4.670223871866862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,32,1,balanced,4.67961057027181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,32,1,power_law_1.01,5.103916931152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,32,1,power_law_1.01,5.122764968872071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,32,1,power_law_1.2,5.1824897766113285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,32,1,power_law_1.2,5.206950378417969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,4,1,balanced,17.09058125813802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,4,1,balanced,17.10308329264323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,4,1,power_law_1.01,16.99781188964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,4,1,power_law_1.01,17.02824249267578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,4,1,power_law_1.2,17.110546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,4,1,power_law_1.2,17.25020751953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,8,1,balanced,3.5643040339152017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,8,1,balanced,3.6280266443888345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,8,1,power_law_1.01,3.718431854248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,8,1,power_law_1.01,3.7327041625976562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,8,1,power_law_1.2,3.7757568359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,4096,2688,22,512,8,1,power_law_1.2,3.7905857086181642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,1,balanced,11.954427083333334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,1,balanced,11.986165364583334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,1,power_law_1.01,11.9067138671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,1,power_law_1.01,12.060396575927735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,1,power_law_1.2,12.119635009765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,1,power_law_1.2,12.275769805908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,2,balanced,6.0567200978597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,2,balanced,6.3995361328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,2,power_law_1.01,8.401766204833985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,2,power_law_1.01,8.976448059082031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,2,power_law_1.2,6.876230621337891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,2,power_law_1.2,9.353485107421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,4,balanced,3.488213221232096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,4,balanced,3.5217065811157227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,4,power_law_1.01,6.917407989501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,4,power_law_1.01,7.32069091796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,4,power_law_1.2,6.1510272979736325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,4,power_law_1.2,6.286067199707031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,8,balanced,2.138810634613037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,8,balanced,2.14630397160848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,8,power_law_1.01,5.597964859008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,8,power_law_1.01,5.827059173583985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,8,power_law_1.2,5.511212921142578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,1,8,power_law_1.2,5.895558547973633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,16,1,balanced,0.8144319852193197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,16,1,balanced,0.8167573610941569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,16,1,power_law_1.01,0.8613439559936523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,16,1,power_law_1.01,0.8629568099975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,16,1,power_law_1.2,0.8544575691223144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,16,1,power_law_1.2,0.8639103889465332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,2,1,balanced,5.470746358235677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,2,1,balanced,5.490224202473958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,2,1,power_law_1.01,5.628883361816406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,2,1,power_law_1.01,5.7024383544921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,2,1,power_law_1.2,5.521260833740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,2,1,power_law_1.2,5.528652954101562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,32,1,balanced,0.5416640043258667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,32,1,balanced,0.5453653335571289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,32,1,power_law_1.01,0.544697618484497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,32,1,power_law_1.01,0.5466432094573974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,32,1,power_law_1.2,0.5471039772033691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,32,1,power_law_1.2,0.5490111827850341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,4,1,balanced,2.767941474914551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,4,1,balanced,2.810954729715983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,4,1,power_law_1.01,2.719264030456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,4,1,power_law_1.01,2.7251775741577147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,4,1,power_law_1.2,2.7328128814697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,4,1,power_law_1.2,2.766361618041992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,8,1,balanced,1.3844480514526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,8,1,balanced,1.4189546902974446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,8,1,power_law_1.01,1.4784192085266112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,8,1,power_law_1.01,1.49237117767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,8,1,power_law_1.2,1.4822848320007325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,16384,2,8,8,1,power_law_1.2,1.4913408279418945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,1,balanced,7.334378560384114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,1,balanced,7.620341618855794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,1,power_law_1.01,8.883455657958985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,1,power_law_1.01,9.139730834960938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,1,power_law_1.2,9.071231842041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,1,power_law_1.2,9.11401596069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,128,balanced,1.0487840175628662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,128,balanced,1.0506079991658528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,128,power_law_1.01,1.243609619140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,128,power_law_1.01,1.2460351943969727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,128,power_law_1.2,1.3389247894287108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,128,power_law_1.2,1.3537919998168946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,16,balanced,1.3601120313008626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,16,balanced,1.3672854105631511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,16,power_law_1.01,1.648512077331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,16,power_law_1.01,1.6823295593261718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,16,power_law_1.2,1.8839935302734374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,16,power_law_1.2,1.9457599639892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,2,balanced,4.128629366556804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,2,balanced,4.681162516276042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,2,power_law_1.01,5.039456176757812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,2,power_law_1.01,5.117984008789063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,2,power_law_1.2,5.141427230834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,2,power_law_1.2,5.342220687866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,256,balanced,1.0314559936523438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,256,balanced,1.0363840262095134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,256,power_law_1.01,1.1704704284667968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,256,power_law_1.01,1.1812416076660157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,256,power_law_1.2,1.315392017364502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,256,power_law_1.2,1.3554304122924805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,32,balanced,1.1823146343231201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,32,balanced,1.183898687362671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,32,power_law_1.01,1.4069567680358888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,32,power_law_1.01,1.470240020751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,32,power_law_1.2,1.5714624404907227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,32,power_law_1.2,1.5871295928955078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,4,balanced,2.502415974934896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,4,balanced,2.50819730758667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,4,power_law_1.01,2.9412031173706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,4,power_law_1.01,2.9760063171386717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,4,power_law_1.2,3.1383487701416017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,4,power_law_1.2,3.260326385498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,64,balanced,1.0964053471883137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,64,balanced,1.0980532964070637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,64,power_law_1.01,1.3233152389526368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,64,power_law_1.01,1.3436223983764648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,64,power_law_1.2,1.4199040412902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,64,power_law_1.2,1.5050880432128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,8,balanced,1.7334133783976238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,8,balanced,1.734554608662923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,8,power_law_1.01,2.1640640258789063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,8,power_law_1.01,2.248198318481445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,8,power_law_1.2,2.430726432800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,1,8,power_law_1.2,2.4885183334350587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,16,1,balanced,1.150271972020467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,16,1,balanced,1.151029348373413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,16,1,power_law_1.01,1.281619167327881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,16,1,power_law_1.01,1.282630443572998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,16,1,power_law_1.2,1.2945280075073242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,16,1,power_law_1.2,1.2967552185058593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,2,1,balanced,3.8215627670288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,2,1,balanced,4.036954561869304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,2,1,power_law_1.01,4.555731201171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,2,1,power_law_1.01,4.584492874145508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,2,1,power_law_1.2,4.656537628173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,2,1,power_law_1.2,4.777267074584961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,32,1,balanced,0.9656480153401693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,32,1,balanced,0.966602643330892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,32,1,power_law_1.01,1.0881664276123046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,32,1,power_law_1.01,1.090003204345703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,32,1,power_law_1.2,1.1048576354980468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,32,1,power_law_1.2,1.1051712036132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,4,1,balanced,2.225269317626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,4,1,balanced,2.284730593363444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,4,1,power_law_1.01,2.5813119888305662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,4,1,power_law_1.01,2.583206367492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,4,1,power_law_1.2,2.6345792770385743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,4,1,power_law_1.2,2.673849678039551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,8,1,balanced,1.4959039688110352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,8,1,balanced,1.5082186063130696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,8,1,power_law_1.01,1.7161792755126952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,8,1,power_law_1.01,1.7204288482666015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,8,1,power_law_1.2,1.738809585571289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2048,8,256,8,1,power_law_1.2,1.7486656188964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,1,balanced,10.422490437825521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,1,balanced,10.710943857828775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,1,power_law_1.01,9.650457763671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,1,power_law_1.01,9.727065277099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,1,power_law_1.2,9.527474975585937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,1,power_law_1.2,9.645247650146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,16,balanced,1.5273280143737793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,16,balanced,1.534165382385254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,16,power_law_1.01,1.8583616256713866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,16,power_law_1.01,1.926950454711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,16,power_law_1.2,2.1313472747802735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,16,power_law_1.2,2.170572853088379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,2,balanced,5.289786656697591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,2,balanced,5.90224011739095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,2,power_law_1.01,5.648704147338867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,2,power_law_1.01,5.68787841796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,2,power_law_1.2,5.716249465942383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,2,power_law_1.2,6.07182731628418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,32,balanced,1.293877363204956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,32,balanced,1.2939679622650146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,32,power_law_1.01,1.6051328659057618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,32,power_law_1.01,1.6780864715576171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,32,power_law_1.2,1.8861312866210938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,32,power_law_1.2,2.0403072357177736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,4,balanced,3.050138791402181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,4,balanced,3.1249545415242515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,4,power_law_1.01,3.2983360290527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,4,power_law_1.01,3.6325119018554686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,4,power_law_1.2,3.7817150115966798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,4,power_law_1.2,3.7955135345458983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,8,balanced,2.019733270009359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,8,balanced,2.025381406148275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,8,power_law_1.01,2.467424011230469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,8,power_law_1.01,2.5077888488769533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,8,power_law_1.2,2.6173248291015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,1,8,power_law_1.2,2.8479551315307616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,16,1,balanced,1.3873173395792644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,16,1,balanced,1.3885653813680012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,16,1,power_law_1.01,1.3798144340515137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,16,1,power_law_1.01,1.3846847534179687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,16,1,power_law_1.2,1.3905216217041017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,16,1,power_law_1.2,1.3909312248229981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,2,1,balanced,5.398682912190755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,2,1,balanced,5.56550407409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,2,1,power_law_1.01,4.927148818969727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,2,1,power_law_1.01,5.031488037109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,2,1,power_law_1.2,4.851808166503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,2,1,power_law_1.2,4.890816116333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,32,1,balanced,1.1925653616587322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,32,1,balanced,1.1943626403808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,32,1,power_law_1.01,1.1901311874389648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,32,1,power_law_1.01,1.190713596343994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,32,1,power_law_1.2,1.203987216949463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,32,1,power_law_1.2,1.2056768417358399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,4,1,balanced,2.8765281041463218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,4,1,balanced,2.8797972997029624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,4,1,power_law_1.01,2.7927679061889648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,4,1,power_law_1.01,2.825632095336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,4,1,power_law_1.2,2.7700288772583006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,4,1,power_law_1.2,2.816147232055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,8,1,balanced,1.7685012817382812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,8,1,balanced,1.7902612686157227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,8,1,power_law_1.01,1.7635072708129882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,8,1,power_law_1.01,1.764512062072754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,8,1,power_law_1.2,1.7649919509887695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,6144,2560,8,160,8,1,power_law_1.2,1.7824127197265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,1,balanced,9.28769048055013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,1,balanced,9.320869445800781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,1,power_law_1.01,10.378975677490235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,1,power_law_1.01,10.405209350585938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,1,power_law_1.2,10.870944213867187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,1,power_law_1.2,10.877043151855469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,128,balanced,1.159727970759074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,128,balanced,1.1603893438975017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,128,power_law_1.01,1.3847616195678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,128,power_law_1.01,1.4183744430541991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,128,power_law_1.2,1.538271999359131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,128,power_law_1.2,1.5422783851623536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,16,balanced,1.5224800109863281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,16,balanced,1.5269120534261067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,16,power_law_1.01,1.8315839767456055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,16,power_law_1.01,1.953068733215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,16,power_law_1.2,2.0476991653442385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,16,power_law_1.2,2.1017215728759764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,2,balanced,4.91812801361084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,2,balanced,5.045066515604655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,2,power_law_1.01,5.924780654907226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,2,power_law_1.01,6.155231857299805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,2,power_law_1.2,6.0780799865722654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,2,power_law_1.2,6.218272018432617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,256,balanced,1.1367786725362141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,256,balanced,1.142250696818034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,256,power_law_1.01,1.290995216369629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,256,power_law_1.01,1.3115903854370117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,256,power_law_1.2,1.4501119613647462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,256,power_law_1.2,1.4807552337646483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,32,balanced,1.3150506814320881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,32,balanced,1.3152533372243245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,32,power_law_1.01,1.5829119682312012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,32,power_law_1.01,1.592915153503418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,32,power_law_1.2,1.7390144348144532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,32,power_law_1.2,1.9046207427978517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,4,balanced,2.893082618713379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,4,balanced,2.8980159759521484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,4,power_law_1.01,3.5798465728759767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,4,power_law_1.01,3.706233596801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,4,power_law_1.2,3.9162368774414062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,4,power_law_1.2,3.9479934692382814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,64,balanced,1.2145493030548096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,64,balanced,1.2151947021484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,64,power_law_1.01,1.45664644241333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,64,power_law_1.01,1.464755153656006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,64,power_law_1.2,1.653228759765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,64,power_law_1.2,1.6790143966674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,8,balanced,1.9515679677327473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,8,balanced,1.964080015818278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,8,power_law_1.01,2.4994688034057617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,8,power_law_1.01,2.553932762145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,8,power_law_1.2,2.693222427368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,1,8,power_law_1.2,2.8364288330078127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,16,1,balanced,1.3218560218811035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,16,1,balanced,1.3269013563791912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,16,1,power_law_1.01,1.4749055862426759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,16,1,power_law_1.01,1.4785920143127442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,16,1,power_law_1.2,1.4904959678649903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,16,1,power_law_1.2,1.499891185760498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,2,1,balanced,4.316778818766276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,2,1,balanced,4.517392158508301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,2,1,power_law_1.01,5.323993682861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,2,1,power_law_1.01,5.501497650146485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,2,1,power_law_1.2,5.367462539672852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,2,1,power_law_1.2,5.481407928466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,32,1,balanced,1.1076160271962483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,32,1,balanced,1.1088746388753254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,32,1,power_law_1.01,1.2533503532409669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,32,1,power_law_1.01,1.2542079925537108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,32,1,power_law_1.2,1.265004825592041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,32,1,power_law_1.2,1.2658623695373534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,4,1,balanced,2.620512008666992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,4,1,balanced,2.7577387491861978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,4,1,power_law_1.01,2.9426752090454102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,4,1,power_law_1.01,3.0302976608276366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,4,1,power_law_1.2,3.052646446228027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,4,1,power_law_1.2,3.1198272705078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,8,1,balanced,1.728256066640218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,8,1,balanced,1.7286720275878906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,8,1,power_law_1.01,1.9857919692993165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,8,1,power_law_1.01,1.9895360946655274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,8,1,power_law_1.2,2.009574317932129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,256,8,1,power_law_1.2,2.0167680740356446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,1,balanced,11.9945068359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,1,balanced,12.343589782714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,1,power_law_1.01,12.132109069824219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,1,power_law_1.01,12.364979553222657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,1,power_law_1.2,12.3548095703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,1,power_law_1.2,12.4980224609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,128,balanced,1.2421600023905437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,128,balanced,1.2453227043151855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,128,power_law_1.01,1.4086272239685058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,128,power_law_1.01,1.41145601272583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,128,power_law_1.2,1.4960512161254882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,128,power_law_1.2,1.5342592239379882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,16,balanced,1.7630133628845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,16,balanced,1.7673226992289226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,16,power_law_1.01,2.0227071762084963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,16,power_law_1.01,2.1689727783203123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,16,power_law_1.2,2.153900718688965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,16,power_law_1.2,2.2254207611083983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,2,balanced,6.55726941426595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,2,balanced,6.746421178181966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,2,power_law_1.01,6.846073913574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,2,power_law_1.01,6.919795227050781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,2,power_law_1.2,6.8245697021484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,2,power_law_1.2,7.0424957275390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,32,balanced,1.4611679712931316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,32,balanced,1.4645493825276692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,32,power_law_1.01,1.6767423629760743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,32,power_law_1.01,1.678316879272461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,32,power_law_1.2,1.7665023803710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,32,power_law_1.2,1.7682880401611327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,4,balanced,3.605285326639811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,4,balanced,3.6242027282714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,4,power_law_1.01,3.911590576171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,4,power_law_1.01,3.9712318420410155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,4,power_law_1.2,4.0665534973144535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,4,power_law_1.2,4.374367904663086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,64,balanced,1.316111962000529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,64,balanced,1.3175040086110432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,64,power_law_1.01,1.483084774017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,64,power_law_1.01,1.507692813873291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,64,power_law_1.2,1.6044607162475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,64,power_law_1.2,1.640608024597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,8,balanced,2.3694666226704917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,8,balanced,2.3837119738260903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,8,power_law_1.01,2.676140785217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,8,power_law_1.01,2.6770368576049806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,8,power_law_1.2,2.7548351287841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,1,8,power_law_1.2,2.8727807998657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,16,1,balanced,1.6589706738789876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,16,1,balanced,1.6648267110188801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,16,1,power_law_1.01,1.654732894897461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,16,1,power_law_1.01,1.6586175918579102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,16,1,power_law_1.2,1.6751487731933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,16,1,power_law_1.2,1.6882816314697267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,2,1,balanced,6.397424062093099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,2,1,balanced,6.54258664449056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,2,1,power_law_1.01,6.228364944458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,2,1,power_law_1.01,6.348921585083008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,2,1,power_law_1.2,6.391353607177734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,2,1,power_law_1.2,6.447360229492188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,32,1,balanced,1.3592212994893391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,32,1,balanced,1.3595466613769531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,32,1,power_law_1.01,1.3510656356811523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,32,1,power_law_1.01,1.356601619720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,32,1,power_law_1.2,1.3750847816467284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,32,1,power_law_1.2,1.3760512351989747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,4,1,balanced,3.523215929667155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,4,1,balanced,3.5400638580322266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,4,1,power_law_1.01,3.3740352630615233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,4,1,power_law_1.01,3.4698814392089843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,4,1,power_law_1.2,3.4616127014160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,4,1,power_law_1.2,3.523392105102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,8,1,balanced,2.226741313934326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,8,1,balanced,2.2361653645833335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,8,1,power_law_1.01,2.218707275390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,8,1,power_law_1.01,2.21978874206543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,8,1,power_law_1.2,2.2858943939208984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,8192,7168,2048,8,384,8,1,power_law_1.2,2.299660873413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,1,balanced,0.2092746694882711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,1,balanced,0.20973867177963257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,1,power_law_1.01,0.1962175965309143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,1,power_law_1.01,0.199072003364563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,1,power_law_1.2,0.20210559368133546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,1,power_law_1.2,0.20364799499511718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,128,balanced,0.03748800108830134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,128,balanced,0.03934400031963984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,128,power_law_1.01,0.03591040074825287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,128,power_law_1.01,0.03711360096931458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,128,power_law_1.2,0.036345601081848145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,128,power_law_1.2,0.03671039938926697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,16,balanced,0.047839999198913574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,16,balanced,0.04971200227737427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,16,power_law_1.01,0.043750399351119997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,16,power_law_1.01,0.04405759871006012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,16,power_law_1.2,0.044377601146698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,16,power_law_1.2,0.04447999894618988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,2,balanced,0.14512000481287637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,2,balanced,0.14813866217931113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,2,power_law_1.01,0.1375872015953064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,2,power_law_1.01,0.13852800130844117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,2,power_law_1.2,0.1379263997077942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,2,power_law_1.2,0.13987840414047242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,32,balanced,0.037503999968369804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,32,balanced,0.03826133410135905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,32,power_law_1.01,0.03683840036392212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,32,power_law_1.01,0.037376001477241516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,32,power_law_1.2,0.03681919872760773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,32,power_law_1.2,0.03688960075378418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,4,balanced,0.08213333288828532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,4,balanced,0.08223466575145721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,4,power_law_1.01,0.07834240198135375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,4,power_law_1.01,0.07959679961204529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,4,power_law_1.2,0.07923840284347534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,4,power_law_1.2,0.07946239709854126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,64,balanced,0.037674665451049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,64,balanced,0.03770133356253306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,64,power_law_1.01,0.036057600378990175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,64,power_law_1.01,0.03648639917373657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,64,power_law_1.2,0.036800000071525577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,64,power_law_1.2,0.037049600481987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,8,balanced,0.06355200211207072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,8,balanced,0.0639466643333435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,8,power_law_1.01,0.05976319909095764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,8,power_law_1.01,0.060524797439575194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,8,power_law_1.2,0.060755199193954466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,1,8,power_law_1.2,0.060889601707458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,2,1,balanced,0.14356799920399985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,2,1,balanced,0.1450399955113729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,2,1,power_law_1.01,0.1346560001373291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,2,1,power_law_1.01,0.13639039993286134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,2,1,power_law_1.2,0.13713279962539673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,2,1,power_law_1.2,0.14017280340194702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,4,1,balanced,0.08418132861455281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,4,1,balanced,0.08452266454696655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,4,1,power_law_1.01,0.07842559814453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,4,1,power_law_1.01,0.07900159955024719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,4,1,power_law_1.2,0.07928320169448852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2048,768,8,128,4,1,power_law_1.2,0.08016639947891235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,1,balanced,0.5810079971949259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,1,balanced,0.5844320058822632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,1,power_law_1.01,0.5096127986907959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,1,power_law_1.01,0.5339776039123535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,1,power_law_1.2,0.5237055778503418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,1,power_law_1.2,0.5357759952545166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,128,balanced,0.04593066871166229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,128,balanced,0.04788800080617269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,128,power_law_1.01,0.04561919867992401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,128,power_law_1.01,0.04601599872112274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,128,power_law_1.2,0.046387198567390445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,128,power_law_1.2,0.046419200301170346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,16,balanced,0.0824533353249232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,16,balanced,0.08335466186205547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,16,power_law_1.01,0.07993599772453308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,16,power_law_1.01,0.0800383985042572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,16,power_law_1.2,0.07938560247421264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,16,power_law_1.2,0.07975040078163147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,2,balanced,0.36689599355061847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,2,balanced,0.3673653205235799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,2,power_law_1.01,0.30794880390167234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,2,power_law_1.01,0.3262399911880493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,2,power_law_1.2,0.3104768037796021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,2,power_law_1.2,0.33035519123077395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,32,balanced,0.07134933272997539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,32,balanced,0.07146666447321574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,32,power_law_1.01,0.06840320229530335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,32,power_law_1.01,0.07027199864387512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,32,power_law_1.2,0.06918399930000305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,32,power_law_1.2,0.06951040029525757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,4,balanced,0.205567995707194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,4,balanced,0.20957332849502563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,4,power_law_1.01,0.1850111961364746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,4,power_law_1.01,0.1913151979446411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,4,power_law_1.2,0.1889407992362976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,4,power_law_1.2,0.2007040023803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,64,balanced,0.04703466594219208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,64,balanced,0.049925332268079124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,64,power_law_1.01,0.05123199820518494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,64,power_law_1.01,0.052691197395324706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,64,power_law_1.2,0.04615040123462677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,64,power_law_1.2,0.049721598625183105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,8,balanced,0.11345600088437398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,8,balanced,0.11346133550008138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,8,power_law_1.01,0.10771839618682862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,8,power_law_1.01,0.10818560123443603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,8,power_law_1.2,0.10488959550857543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,1,8,power_law_1.2,0.10524799823760986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,16,1,balanced,0.24475733439127603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,16,1,balanced,0.2454026738802592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,16,1,power_law_1.01,0.20881919860839843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,16,1,power_law_1.01,0.21902720928192138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,16,1,power_law_1.2,0.21994240283966066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,16,1,power_law_1.2,0.22033920288085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,2,1,balanced,0.3535573482513428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,2,1,balanced,0.35674134890238446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,2,1,power_law_1.01,0.3014080047607422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,2,1,power_law_1.01,0.3036799907684326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,2,1,power_law_1.2,0.3013184070587158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,2,1,power_law_1.2,0.3077568054199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,32,1,balanced,0.1962666710217794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,32,1,balanced,0.19670399030049643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,32,1,power_law_1.01,0.17169920206069947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,32,1,power_law_1.01,0.17698559761047364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,32,1,power_law_1.2,0.17148799896240235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,32,1,power_law_1.2,0.17397119998931884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,4,1,balanced,0.19347200791041055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,4,1,balanced,0.1950613260269165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,4,1,power_law_1.01,0.17971199750900269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,4,1,power_law_1.01,0.18077440261840821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,4,1,power_law_1.2,0.18140799999237062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,4,1,power_law_1.2,0.18472319841384888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,8,1,balanced,0.422815998395284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,8,1,balanced,0.4248533248901367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,8,1,power_law_1.01,0.362444806098938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,8,1,power_law_1.01,0.37436161041259763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,8,1,power_law_1.2,0.3650048017501831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,2688,1856,6,128,8,1,power_law_1.2,0.3714368104934692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,1,balanced,1.1844586531321208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,1,balanced,1.1994826793670654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,1,power_law_1.01,0.9291839599609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,1,power_law_1.01,0.9387071609497071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,1,power_law_1.2,0.9181759834289551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,1,power_law_1.2,0.9442303657531739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,128,balanced,0.04966933528582255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,128,balanced,0.05410666763782501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,128,power_law_1.01,0.04806399941444397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,128,power_law_1.01,0.048307201266288756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,128,power_law_1.2,0.0500927984714508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,128,power_law_1.2,0.050323200225830075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,16,balanced,0.11370666821797688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,16,balanced,0.11482133467992146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,16,power_law_1.01,0.10209280252456665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,16,power_law_1.01,0.10254080295562744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,16,power_law_1.2,0.10017280578613282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,16,power_law_1.2,0.10984959602355956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,2,balanced,0.6197706858317057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,2,balanced,0.6259573300679525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,2,power_law_1.01,0.521011209487915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,2,power_law_1.01,0.5260799884796142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,2,power_law_1.2,0.513759994506836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,2,power_law_1.2,0.5168255805969239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,256,balanced,0.04783466458320618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,256,balanced,0.04986133178075155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,256,power_law_1.01,0.04684160053730011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,256,power_law_1.01,0.04733439981937408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,256,power_law_1.2,0.04746879935264588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,256,power_law_1.2,0.047775998711586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,32,balanced,0.08365333080291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,32,balanced,0.08449066678682964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,32,power_law_1.01,0.08010879755020142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,32,power_law_1.01,0.08095359802246094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,32,power_law_1.2,0.07888000011444092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,32,power_law_1.2,0.0800383985042572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,4,balanced,0.33103466033935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,4,balanced,0.33292800188064575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,4,power_law_1.01,0.28786559104919435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,4,power_law_1.01,0.2960767984390259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,4,power_law_1.2,0.27654399871826174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,4,power_law_1.2,0.2882623910903931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,64,balanced,0.0703306645154953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,64,balanced,0.07106133302052815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,64,power_law_1.01,0.06895359754562377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,64,power_law_1.01,0.06914560198783874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,64,power_law_1.2,0.0676479995250702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,64,power_law_1.2,0.06846719980239868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,8,balanced,0.21230934063593546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,8,balanced,0.21450134118398032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,8,power_law_1.01,0.1937407970428467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,8,power_law_1.01,0.19406720399856567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,8,power_law_1.2,0.15808000564575195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,1,8,power_law_1.2,0.1771456003189087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,16,1,balanced,0.12916266918182373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,16,1,balanced,0.12966400384902954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,16,1,power_law_1.01,0.11205120086669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,16,1,power_law_1.01,0.11242879629135132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,16,1,power_law_1.2,0.1086400032043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,16,1,power_law_1.2,0.10904959440231324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,2,1,balanced,0.6174933513005575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,2,1,balanced,0.618506669998169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,2,1,power_law_1.01,0.48404479026794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,2,1,power_law_1.01,0.48901758193969724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,2,1,power_law_1.2,0.4851583957672119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,2,1,power_law_1.2,0.4971007823944092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,32,1,balanced,0.0999840001265208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,32,1,balanced,0.10058133800824483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,32,1,power_law_1.01,0.08732799887657165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,32,1,power_law_1.01,0.08867200016975403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,32,1,power_law_1.2,0.08703359961509705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,32,1,power_law_1.2,0.08799359798431397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,4,1,balanced,0.3250240087509155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,4,1,balanced,0.3272479971249898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,4,1,power_law_1.01,0.27614080905914307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,4,1,power_law_1.01,0.2836287975311279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,4,1,power_law_1.2,0.271891188621521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,4,1,power_law_1.2,0.2785088062286377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,8,1,balanced,0.2092319925626119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,8,1,balanced,0.21185600757598877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,8,1,power_law_1.01,0.1721984028816223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,8,1,power_law_1.01,0.17422720193862914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,8,1,power_law_1.2,0.1683583974838257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,3072,1536,8,256,8,1,power_law_1.2,0.17496320009231567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,1,balanced,0.5395093361536661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,1,balanced,0.545743981997172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,1,power_law_1.01,0.6057792186737061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,1,power_law_1.01,0.6209280014038085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,1,power_law_1.2,0.5938879966735839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,1,power_law_1.2,0.6043392181396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,2,balanced,0.3362186749776204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,2,balanced,0.33699198563893634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,2,power_law_1.01,0.3855168104171753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,2,power_law_1.01,0.3978111982345581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,2,power_law_1.2,0.3766016006469727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,2,power_law_1.2,0.39347200393676757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,4,balanced,0.23281600077946982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,4,balanced,0.24022400379180908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,4,power_law_1.01,0.28263680934906005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,4,power_law_1.01,0.28965120315551757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,4,power_law_1.2,0.29038081169128416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,4,power_law_1.2,0.29066879749298097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,8,balanced,0.20177066326141357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,8,balanced,0.20349866151809692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,8,power_law_1.01,0.2275968074798584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,8,power_law_1.01,0.24142720699310302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,8,power_law_1.2,0.23629438877105713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,1,8,power_law_1.2,0.23998720645904542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,16,1,balanced,0.07639466722806294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,16,1,balanced,0.07660800218582153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,16,1,power_law_1.01,0.07566720247268677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,16,1,power_law_1.01,0.07596799731254578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,16,1,power_law_1.2,0.07402880191802978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,16,1,power_law_1.2,0.0765887975692749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,2,1,balanced,0.2850666642189026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,2,1,balanced,0.28521599372227985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,2,1,power_law_1.01,0.29171199798583985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,2,1,power_law_1.01,0.3026432037353516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,2,1,power_law_1.2,0.299289608001709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,2,1,power_law_1.2,0.30062079429626465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,32,1,balanced,0.05982933441797892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,32,1,balanced,0.06432533264160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,32,1,power_law_1.01,0.06286720037460328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,32,1,power_law_1.01,0.06302719712257385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,32,1,power_law_1.2,0.061433601379394534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,32,1,power_law_1.2,0.06247040033340454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,4,1,balanced,0.1564533313115438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,4,1,balanced,0.15678399801254272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,4,1,power_law_1.01,0.17063679695129394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,4,1,power_law_1.01,0.17378560304641724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,4,1,power_law_1.2,0.1583359956741333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,4,1,power_law_1.2,0.17557120323181152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,8,1,balanced,0.10335999727249146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,8,1,balanced,0.10378133257230122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,8,1,power_law_1.01,0.09981439709663391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,8,1,power_law_1.01,0.1014847993850708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,8,1,power_law_1.2,0.10105600357055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,14336,2,8,8,1,power_law_1.2,0.10124800205230713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,1,balanced,0.8166453043619791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,1,balanced,0.817242701848348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,1,power_law_1.01,0.7521791934967041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,1,power_law_1.01,0.7681600093841553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,1,power_law_1.2,0.7659264087677002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,1,power_law_1.2,0.7800767898559571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,128,balanced,0.05393599967161814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,128,balanced,0.05402666827042898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,128,power_law_1.01,0.052313601970672606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,128,power_law_1.01,0.05235840082168579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,128,power_law_1.2,0.05253120064735413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,128,power_law_1.2,0.052825599908828735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,16,balanced,0.09804266691207886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,16,balanced,0.09904533624649048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,16,power_law_1.01,0.0939136028289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,16,power_law_1.01,0.09499520063400269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,16,power_law_1.2,0.09404799938201905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,16,power_law_1.2,0.09529600143432618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,2,balanced,0.43108801047007245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,2,balanced,0.43186668554941815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,2,power_law_1.01,0.40491518974304197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,2,power_law_1.01,0.4138175964355469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,2,power_law_1.2,0.4067647933959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,2,power_law_1.2,0.41730561256408694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,32,balanced,0.08283733328183492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,32,balanced,0.0830506682395935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,32,power_law_1.01,0.07984640002250672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,32,power_law_1.01,0.08121600151062011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,32,power_law_1.2,0.081004798412323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,32,power_law_1.2,0.08170239925384522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,4,balanced,0.2548533280690511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,4,balanced,0.25814932584762573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,4,power_law_1.01,0.24411520957946778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,4,power_law_1.01,0.2511807918548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,4,power_law_1.2,0.23490560054779053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,4,power_law_1.2,0.2527424097061157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,64,balanced,0.06420266628265381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,64,balanced,0.06810666620731354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,64,power_law_1.01,0.06643199920654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,64,power_law_1.01,0.07013760209083557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,64,power_law_1.2,0.06368640065193176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,64,power_law_1.2,0.06814079880714416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,8,balanced,0.13854933778444925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,8,balanced,0.13988266388575235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,8,power_law_1.01,0.12917759418487548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,8,power_law_1.01,0.130457603931427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,8,power_law_1.2,0.13521920442581176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,1,8,power_law_1.2,0.13665920495986938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,16,1,balanced,0.10356799761454265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,16,1,balanced,0.10518399874369304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,16,1,power_law_1.01,0.09960319995880126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,16,1,power_law_1.01,0.09964159727096558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,16,1,power_law_1.2,0.10042879581451417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,16,1,power_law_1.2,0.10113279819488526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,2,1,balanced,0.38921598593393963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,2,1,balanced,0.3901120026906331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,2,1,power_law_1.01,0.36326398849487307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,2,1,power_law_1.01,0.36419200897216797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,2,1,power_law_1.2,0.3721280097961426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,2,1,power_law_1.2,0.3734591960906982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,32,1,balanced,0.08681600292523702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,32,1,balanced,0.08861866593360901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,32,1,power_law_1.01,0.08398720026016235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,32,1,power_law_1.01,0.08438400030136109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,32,1,power_law_1.2,0.0844223976135254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,32,1,power_law_1.2,0.0856383979320526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,4,1,balanced,0.2540000081062317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,4,1,balanced,0.2560799916585286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,4,1,power_law_1.01,0.24705278873443604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,4,1,power_law_1.01,0.24726400375366211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,4,1,power_law_1.2,0.2452608108520508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,4,1,power_law_1.2,0.24791040420532226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,8,1,balanced,0.1397813359896342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,8,1,balanced,0.14040000240008035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,8,1,power_law_1.01,0.1306496024131775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,8,1,power_law_1.01,0.1340224027633667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,8,1,power_law_1.2,0.13389439582824708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,1536,8,128,8,1,power_law_1.2,0.13444479703903198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,1,balanced,5.4415842692057295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,1,balanced,5.467274983723958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,1,power_law_1.01,4.611238479614258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,1,power_law_1.01,4.684864044189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,1,power_law_1.2,4.6670783996582035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,1,power_law_1.2,4.7481025695800785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,128,balanced,0.12225600083669026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,128,balanced,0.12271466851234436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,128,power_law_1.01,0.12041599750518799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,128,power_law_1.01,0.12067199945449829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,128,power_law_1.2,0.1198464035987854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,128,power_law_1.2,0.1199679970741272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,16,balanced,0.4189759890238444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,16,balanced,0.4219199816385905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,16,power_law_1.01,0.3771775960922241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,16,power_law_1.01,0.39022719860076904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,16,power_law_1.2,0.38453121185302735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,16,power_law_1.2,0.39064319133758546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,2,balanced,2.746074676513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,2,balanced,2.776858647664388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,2,power_law_1.01,2.3471551895141602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,2,power_law_1.01,2.422323226928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,2,power_law_1.2,2.376460838317871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,2,power_law_1.2,2.437164878845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,256,balanced,0.10640000303586324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,256,balanced,0.10697066783905029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,256,power_law_1.01,0.10460799932479858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,256,power_law_1.01,0.10481280088424683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,256,power_law_1.2,0.1043328046798706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,256,power_law_1.2,0.10594559907913208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,32,balanced,0.25704000393549603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,32,balanced,0.2675519982973735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,32,power_law_1.01,0.22362880706787108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,32,power_law_1.01,0.2432703971862793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,32,power_law_1.2,0.22569599151611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,32,power_law_1.2,0.25438079833984373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,4,balanced,1.4090666770935059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,4,balanced,1.4170239766438801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,4,power_law_1.01,1.1960063934326173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,4,power_law_1.01,1.226137638092041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,4,power_law_1.2,1.2382847785949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,4,power_law_1.2,1.2409088134765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,64,balanced,0.15213333566983542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,64,balanced,0.15286399920781454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,64,power_law_1.01,0.14569599628448487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,64,power_law_1.01,0.14814079999923707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,64,power_law_1.2,0.14234880208969117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,64,power_law_1.2,0.15066239833831788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,8,balanced,0.7389280001322428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,8,balanced,0.7416213353474935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,8,power_law_1.01,0.6538496017456055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,8,power_law_1.01,0.7067200183868408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,8,power_law_1.2,0.660038423538208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,1,8,power_law_1.2,0.6922560214996338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,16,1,balanced,1.8127360343933105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,16,1,balanced,1.814245382944743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,16,1,power_law_1.01,1.5499839782714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,16,1,power_law_1.01,1.5517824172973633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,16,1,power_law_1.2,1.5673983573913575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,16,1,power_law_1.2,1.5764991760253906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,2,1,balanced,2.4479519526163735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,2,1,balanced,2.4664692878723145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,2,1,power_law_1.01,2.099782371520996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,2,1,power_law_1.01,2.1195199966430662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,2,1,power_law_1.2,2.1082048416137695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,2,1,power_law_1.2,2.125695991516113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,32,1,balanced,1.213701327641805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,32,1,balanced,1.2163626352945964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,32,1,power_law_1.01,1.0407936096191406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,32,1,power_law_1.01,1.050815963745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,32,1,power_law_1.2,1.057203197479248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,4,1,balanced,1.4039093653361003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,4,1,balanced,1.4040640195210774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,4,1,power_law_1.01,1.200057601928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,4,1,power_law_1.01,1.2117631912231446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,4,1,power_law_1.2,1.1993023872375488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,4,1,power_law_1.2,1.2481216430664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,8,1,balanced,0.755413293838501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,8,1,balanced,0.7640693187713623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,8,1,power_law_1.01,0.6563648223876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,8,1,power_law_1.01,0.657919979095459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,8,1,power_law_1.2,0.6629951953887939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,4096,2688,22,512,8,1,power_law_1.2,0.6638591766357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,1,balanced,0.8616373538970947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,1,balanced,0.8636000156402588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,1,power_law_1.01,1.0109888076782227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,1,power_law_1.01,1.0162943840026855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,1,power_law_1.2,0.9924287796020508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,1,power_law_1.2,1.0222911834716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,2,balanced,0.48687465985616046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,2,balanced,0.489898681640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,2,power_law_1.01,0.6063744068145752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,2,power_law_1.01,0.6127744197845459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,2,power_law_1.2,0.5802815914154053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,2,power_law_1.2,0.5978367805480957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,4,balanced,0.31587199370066327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,4,balanced,0.31937066713968915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,4,power_law_1.01,0.39175679683685305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,4,power_law_1.01,0.39832320213317873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,4,power_law_1.2,0.4003456115722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,4,power_law_1.2,0.40414719581604003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,8,balanced,0.25593066215515137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,8,balanced,0.2577066620190938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,8,power_law_1.01,0.29374079704284667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,8,power_law_1.01,0.2956928014755249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,8,power_law_1.2,0.2830976009368896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,1,8,power_law_1.2,0.3241280078887939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,16,1,balanced,0.10139200091362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,16,1,balanced,0.10173867146174113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,16,1,power_law_1.01,0.10285439491271972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,16,1,power_law_1.01,0.10511360168457032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,16,1,power_law_1.2,0.10371199846267701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,16,1,power_law_1.2,0.10414079427719117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,2,1,balanced,0.44249598185221356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,2,1,balanced,0.4620000123977661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,2,1,power_law_1.01,0.4832128047943115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,2,1,power_law_1.01,0.49706878662109377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,2,1,power_law_1.2,0.4872576236724854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,2,1,power_law_1.2,0.5046016216278076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,32,1,balanced,0.08690133690834045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,32,1,balanced,0.08778666456540425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,32,1,power_law_1.01,0.08678399920463561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,32,1,power_law_1.01,0.08687360286712646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,32,1,power_law_1.2,0.08655359745025634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,32,1,power_law_1.2,0.08662400245666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,4,1,balanced,0.23794132471084595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,4,1,balanced,0.24315732717514038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,4,1,power_law_1.01,0.26777598857879636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,4,1,power_law_1.01,0.274617600440979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,4,1,power_law_1.2,0.267193603515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,4,1,power_law_1.2,0.27383038997650144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,8,1,balanced,0.14482133587201437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,8,1,balanced,0.1507306694984436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,8,1,power_law_1.01,0.14265600442886353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,8,1,power_law_1.01,0.1448192000389099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,8,1,power_law_1.2,0.14176000356674195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,16384,2,8,8,1,power_law_1.2,0.14226560592651366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,1,balanced,3.121429443359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,1,balanced,3.1719627380371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,1,power_law_1.01,2.4828224182128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,1,power_law_1.01,2.496780776977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,1,power_law_1.2,2.451257514953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,1,power_law_1.2,2.4742015838623046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,128,balanced,0.10313066840171814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,128,balanced,0.10413333773612976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,128,power_law_1.01,0.10202879905700683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,128,power_law_1.01,0.10224000215530396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,128,power_law_1.2,0.10196479558944702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,128,power_law_1.2,0.10209280252456665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,16,balanced,0.24896534283955893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,16,balanced,0.2525866627693176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,16,power_law_1.01,0.22954239845275878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,16,power_law_1.01,0.23016319274902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,16,power_law_1.2,0.22088959217071533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,16,power_law_1.2,0.22540159225463868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,2,balanced,1.585370699564616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,2,balanced,1.6161920229593914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,2,power_law_1.01,1.2998208045959472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,2,power_law_1.01,1.330662441253662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,2,power_law_1.2,1.2939200401306152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,2,power_law_1.2,1.3471808433532715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,256,balanced,0.09058133761088054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,256,balanced,0.09359467029571533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,256,power_law_1.01,0.08658559918403626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,256,power_law_1.01,0.09373440146446228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,256,power_law_1.2,0.08487679958343505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,256,power_law_1.2,0.09382399916648865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,32,balanced,0.1518880029519399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,32,balanced,0.15284799536069235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,32,power_law_1.01,0.1422719955444336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,32,power_law_1.01,0.15011199712753295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,32,power_law_1.2,0.13589119911193848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,32,power_law_1.2,0.13878400325775148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,4,balanced,0.8289493719736735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,4,balanced,0.8318933645884196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,4,power_law_1.01,0.6889920234680176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,4,power_law_1.01,0.6904895782470704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,4,power_law_1.2,0.6665728092193604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,4,power_law_1.2,0.6842432022094727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,64,balanced,0.11700266599655151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,64,balanced,0.11931733290354411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,64,power_law_1.01,0.11478400230407715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,64,power_law_1.01,0.11643520593643189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,64,power_law_1.2,0.10885759592056274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,64,power_law_1.2,0.11642240285873413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,8,balanced,0.43086401621500653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,8,balanced,0.43134931723276776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,8,power_law_1.01,0.39105920791625975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,8,power_law_1.01,0.4086912155151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,8,power_law_1.2,0.3942591905593872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,1,8,power_law_1.2,0.39790079593658445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,16,1,balanced,0.25884799162546795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,16,1,balanced,0.2590773304303487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,16,1,power_law_1.01,0.20741760730743408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,16,1,power_law_1.01,0.20873599052429198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,16,1,power_law_1.2,0.21325440406799318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,16,1,power_law_1.2,0.21344640254974365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,2,1,balanced,1.59441073735555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,2,1,balanced,1.6055787404378254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,2,1,power_law_1.01,1.2773695945739747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,2,1,power_law_1.01,1.2851263999938964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,2,1,power_law_1.2,1.2576128005981446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,2,1,power_law_1.2,1.2827584266662597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,32,1,balanced,0.18117332458496094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,32,1,balanced,0.18278932571411133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,32,1,power_law_1.01,0.15633280277252198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,32,1,power_law_1.01,0.15749759674072267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,32,1,power_law_1.2,0.15748480558395386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,32,1,power_law_1.2,0.15826560258865358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,4,1,balanced,0.8061920007069906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,4,1,balanced,0.8089493115743002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,4,1,power_law_1.01,0.6318592071533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,4,1,power_law_1.01,0.6381440162658691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,4,1,power_law_1.2,0.6339072227478028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,4,1,power_law_1.2,0.6429823875427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,8,1,balanced,0.429418683052063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,8,1,balanced,0.43373334407806396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,8,1,power_law_1.01,0.3764031887054443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,8,1,power_law_1.01,0.3796351909637451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,8,1,power_law_1.2,0.37766399383544924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2048,8,256,8,1,power_law_1.2,0.37906560897827146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,1,balanced,2.464207967122396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,1,balanced,2.4687840143839517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,1,power_law_1.01,2.190847969055176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,1,power_law_1.01,2.216953659057617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,1,power_law_1.2,2.1877504348754884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,1,power_law_1.2,2.2257152557373048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,16,balanced,0.1973386605580648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,16,balanced,0.19895466168721518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,16,power_law_1.01,0.1888383984565735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,16,power_law_1.01,0.18984960317611693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,16,power_law_1.2,0.1913856029510498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,16,power_law_1.2,0.1926144003868103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,2,balanced,1.2802026271820068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,2,balanced,1.2882293065388997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,2,power_law_1.01,1.1179007530212401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,2,power_law_1.01,1.1240127563476563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,2,power_law_1.2,1.1424384117126465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,2,power_law_1.2,1.1480192184448241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,32,balanced,0.1378773351510366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,32,balanced,0.1386240025361379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,32,power_law_1.01,0.1309183955192566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,32,power_law_1.01,0.134169602394104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,32,power_law_1.2,0.13320959806442262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,32,power_law_1.2,0.13485440015792846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,4,balanced,0.6622080008188883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,4,balanced,0.665450652440389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,4,power_law_1.01,0.6112256050109863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,4,power_law_1.01,0.6155200004577637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,4,power_law_1.2,0.6105279922485352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,4,power_law_1.2,0.6224256038665772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,8,balanced,0.38000531991322833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,8,balanced,0.3803946574529012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,8,power_law_1.01,0.37713921070098877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,8,power_law_1.01,0.37720959186553954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,8,power_law_1.2,0.36876161098480226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,1,8,power_law_1.2,0.3691200017929077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,16,1,balanced,0.2116533319155375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,16,1,balanced,0.2124533255894979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,16,1,power_law_1.01,0.19137920141220094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,16,1,power_law_1.01,0.19538559913635253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,16,1,power_law_1.2,0.19217920303344727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,16,1,power_law_1.2,0.19827200174331666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,2,1,balanced,1.2476800282796223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,2,1,balanced,1.2582133611043294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,2,1,power_law_1.01,1.1005248069763183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,2,1,power_law_1.01,1.1096192359924317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,2,1,power_law_1.2,1.1215231895446778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,2,1,power_law_1.2,1.1520447731018066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,32,1,balanced,0.16235733032226562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,32,1,balanced,0.1625333329041799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,32,1,power_law_1.01,0.14858880043029785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,32,1,power_law_1.01,0.15160319805145264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,32,1,power_law_1.2,0.1518720030784607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,32,1,power_law_1.2,0.15593600273132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,4,1,balanced,0.6332053343454996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,4,1,balanced,0.6402399937311808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,4,1,power_law_1.01,0.5772607803344727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,4,1,power_law_1.01,0.5831232070922852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,4,1,power_law_1.2,0.5884352207183838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,4,1,power_law_1.2,0.5915840148925782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,8,1,balanced,0.38021334012349445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,8,1,balanced,0.3803573449452718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,8,1,power_law_1.01,0.345414400100708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,8,1,power_law_1.01,0.35589120388031004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,8,1,power_law_1.2,0.3624000072479248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,6144,2560,8,160,8,1,power_law_1.2,0.366483211517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,1,balanced,3.6625919342041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,1,balanced,3.6693547566731772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,1,power_law_1.01,2.8636608123779297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,1,power_law_1.01,2.930611228942871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,1,power_law_1.2,2.839059257507324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,1,power_law_1.2,2.8836992263793944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,128,balanced,0.1153546671072642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,128,balanced,0.11732266346613567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,128,power_law_1.01,0.11438720226287842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,128,power_law_1.01,0.11463680267333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,128,power_law_1.2,0.11469440460205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,128,power_law_1.2,0.11590399742126464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,16,balanced,0.27958399057388306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,16,balanced,0.27962666749954224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,16,power_law_1.01,0.24895360469818115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,16,power_law_1.01,0.25303680896759034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,16,power_law_1.2,0.2576832056045532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,16,power_law_1.2,0.25929598808288573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,2,balanced,1.8732746442159016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,2,balanced,1.892122745513916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,2,power_law_1.01,1.5496319770812987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,2,power_law_1.01,1.5808128356933593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,2,power_law_1.2,1.4698880195617676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,2,power_law_1.2,1.4840127944946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,256,balanced,0.10731732845306396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,256,balanced,0.1104693313439687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,256,power_law_1.01,0.10402560234069824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,256,power_law_1.01,0.10707839727401733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,256,power_law_1.2,0.101363205909729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,256,power_law_1.2,0.10677759647369385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,32,balanced,0.17285333077112833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,32,balanced,0.17287999391555786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,32,power_law_1.01,0.15903359651565552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,32,power_law_1.01,0.1597632050514221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,32,power_law_1.2,0.16101759672164917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,32,power_law_1.2,0.16212480068206786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,4,balanced,0.9711306889851888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,4,balanced,0.9750613371531168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,4,power_law_1.01,0.7787712097167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,4,power_law_1.01,0.8310720443725585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,4,power_law_1.2,0.7873472213745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,4,power_law_1.2,0.8301631927490234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,64,balanced,0.13226133584976196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,64,balanced,0.13362133502960205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,64,power_law_1.01,0.1245695948600769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,64,power_law_1.01,0.12951680421829223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,64,power_law_1.2,0.13070080280303956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,64,power_law_1.2,0.13085440397262574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,8,balanced,0.5085119803746542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,8,balanced,0.5107200145721436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,8,power_law_1.01,0.4491583824157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,8,power_law_1.01,0.4726399898529053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,8,power_law_1.2,0.4299456119537354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,1,8,power_law_1.2,0.4386879920959473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,16,1,balanced,0.30001066128412884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,16,1,balanced,0.30081067482630414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,16,1,power_law_1.01,0.24243199825286865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,16,1,power_law_1.01,0.24274559020996095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,16,1,power_law_1.2,0.24578559398651123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,16,1,power_law_1.2,0.24637439250946044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,2,1,balanced,1.861738681793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,2,1,balanced,1.878053347269694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,2,1,power_law_1.01,1.4706815719604491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,2,1,power_law_1.01,1.4962559700012208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,2,1,power_law_1.2,1.490668773651123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,2,1,power_law_1.2,1.5138943672180176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,32,1,balanced,0.20868800083796182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,32,1,balanced,0.20935465892155966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,32,1,power_law_1.01,0.17916159629821776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,32,1,power_law_1.01,0.18227200508117675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,32,1,power_law_1.2,0.1796223998069763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,32,1,power_law_1.2,0.1832383990287781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,4,1,balanced,0.944917360941569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,4,1,balanced,0.9458773136138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,4,1,power_law_1.01,0.747756814956665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,4,1,power_law_1.01,0.752019214630127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,4,1,power_law_1.2,0.7313536167144775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,4,1,power_law_1.2,0.7543551921844482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,8,1,balanced,0.5025013287862142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,8,1,balanced,0.5047093232472738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,8,1,power_law_1.01,0.43751678466796873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,8,1,power_law_1.01,0.4424384117126465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,8,1,power_law_1.2,0.43653120994567873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,256,8,1,power_law_1.2,0.44007039070129395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,1,balanced,5.4765974680582685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,1,balanced,5.533103942871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,1,power_law_1.01,3.8959808349609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,1,power_law_1.01,3.897945785522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,1,power_law_1.2,3.7819393157958983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,1,power_law_1.2,3.8514942169189452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,128,balanced,0.12185600399971008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,128,balanced,0.12187199791272481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,128,power_law_1.01,0.11912319660186768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,128,power_law_1.01,0.11920640468597413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,128,power_law_1.2,0.11923840045928955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,128,power_law_1.2,0.11957119703292847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,16,balanced,0.4442986647288005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,16,balanced,0.4457919994990031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,16,power_law_1.01,0.3331712007522583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,16,power_law_1.01,0.3602880001068115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,16,power_law_1.2,0.355187201499939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,16,power_law_1.2,0.38899199962615966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,2,balanced,2.7622451782226562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,2,balanced,2.8051093419392905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,2,power_law_1.01,2.084275245666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,2,power_law_1.01,2.149068832397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,2,power_law_1.2,2.1068159103393556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,2,power_law_1.2,2.1650304794311523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,32,balanced,0.23634666204452515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,32,balanced,0.23864533503850302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,32,power_law_1.01,0.2034303903579712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,32,power_law_1.01,0.20805120468139648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,32,power_law_1.2,0.20176639556884765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,32,power_law_1.2,0.20482559204101564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,4,balanced,1.410373369852702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,4,balanced,1.4132426579793294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,4,power_law_1.01,1.0202943801879882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,4,power_law_1.01,1.0783743858337402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,4,power_law_1.2,1.0092351913452149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,4,power_law_1.2,1.0562560081481933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,64,balanced,0.14844266573588052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,64,balanced,0.149317334095637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,64,power_law_1.01,0.14043519496917725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,64,power_law_1.01,0.1434880018234253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,64,power_law_1.2,0.13999999761581422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,64,power_law_1.2,0.1427135944366455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,8,balanced,0.731269359588623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,8,balanced,0.7321173350016276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,8,power_law_1.01,0.5901247978210449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,8,power_law_1.01,0.6703551769256592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,8,power_law_1.2,0.6108352184295655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,1,8,power_law_1.2,0.6392576217651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,16,1,balanced,0.47645334402720135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,16,1,balanced,0.47939733664194745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,16,1,power_law_1.01,0.3221184015274048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,16,1,power_law_1.01,0.3243904113769531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,16,1,power_law_1.2,0.30512640476226804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,16,1,power_law_1.2,0.3096575975418091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,2,1,balanced,2.783594767252604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,2,1,balanced,2.797978719075521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,2,1,power_law_1.01,1.9767168045043946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,2,1,power_law_1.01,1.9939903259277343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,2,1,power_law_1.2,1.9306047439575196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,2,1,power_law_1.2,1.955526351928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,32,1,balanced,0.2847413420677185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,32,1,balanced,0.2851253350575765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,32,1,power_law_1.01,0.22109439373016357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,32,1,power_law_1.01,0.22216320037841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,32,1,power_law_1.2,0.21721599102020264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,32,1,power_law_1.2,0.21766400337219238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,4,1,balanced,1.3809439341227214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,4,1,balanced,1.3971467018127441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,4,1,power_law_1.01,0.9859583854675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,4,1,power_law_1.01,0.9875840187072754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,4,1,power_law_1.2,0.958521556854248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,4,1,power_law_1.2,0.9677120208740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,8,1,balanced,0.7381333510080973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,8,1,balanced,0.7395946979522705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,8,1,power_law_1.01,0.533184003829956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,8,1,power_law_1.01,0.5390463829040527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,8,1,power_law_1.2,0.5177343845367431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,float16,96,7168,2048,8,384,8,1,power_law_1.2,0.5288576126098633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,1,balanced,0.025493333737055462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,1,balanced,0.02717333287000656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,1,power_law_1.01,0.024723200500011443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,1,power_law_1.01,0.024985599517822265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,1,power_law_1.2,0.024460799992084503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,1,power_law_1.2,0.024659200012683867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,128,balanced,0.02739199995994568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,128,balanced,0.027701333165168762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,128,power_law_1.01,0.0265855997800827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,128,power_law_1.01,0.026822400093078614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,128,power_law_1.2,0.026572799682617186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,128,power_law_1.2,0.026700800657272337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,16,balanced,0.027327999472618103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,16,balanced,0.02743999908367793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,16,power_law_1.01,0.029734399914741517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,16,power_law_1.01,0.029791998863220214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,16,power_law_1.2,0.02873600125312805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,16,power_law_1.2,0.029862400889396668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,2,balanced,0.027461332579453785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,2,balanced,0.027493332823117573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,2,power_law_1.01,0.029721599817276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,2,power_law_1.01,0.02993920147418976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,2,power_law_1.2,0.02995840013027191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,2,power_law_1.2,0.03017599880695343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,32,balanced,0.027477333943049114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,32,balanced,0.029498666524887085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,32,power_law_1.01,0.027027198672294618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,32,power_law_1.01,0.02707839906215668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,32,power_law_1.2,0.027616000175476073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,32,power_law_1.2,0.02768000066280365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,4,balanced,0.02923733244339625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,4,balanced,0.029290666182835896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,4,power_law_1.01,0.029900801181793214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,4,power_law_1.01,0.030272001028060914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,4,power_law_1.2,0.02834559977054596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,4,power_law_1.2,0.030079999566078187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,64,balanced,0.027402666707833607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,64,balanced,0.02924266705910365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,64,power_law_1.01,0.02622080147266388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,64,power_law_1.01,0.028358399868011475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,64,power_law_1.2,0.026867198944091796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,64,power_law_1.2,0.02736639976501465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,8,balanced,0.027376001079877216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,8,balanced,0.029498666524887085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,8,power_law_1.01,0.028838399052619933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,8,power_law_1.01,0.02969599962234497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,8,power_law_1.2,0.02951039969921112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,1,8,power_law_1.2,0.030099201202392577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,2,1,balanced,0.021231998999913532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,2,1,balanced,0.023285334308942158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,2,1,power_law_1.01,0.020953600108623505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,2,1,power_law_1.01,0.021376000344753267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,2,1,power_law_1.2,0.021190400421619415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,2,1,power_law_1.2,0.02192640006542206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,4,1,balanced,0.023130667706330616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,4,1,balanced,0.023354666928450268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,4,1,power_law_1.01,0.021004800498485566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,4,1,power_law_1.01,0.02149759978055954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,4,1,power_law_1.2,0.02091519981622696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2048,768,8,128,4,1,power_law_1.2,0.02136960029602051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,1,balanced,0.03558400024970373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,1,balanced,0.035599999129772186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,1,power_law_1.01,0.03330560028553009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,1,power_law_1.01,0.03565439879894257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,1,power_law_1.2,0.033395200967788696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,1,power_law_1.2,0.034176000952720643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,128,balanced,0.03102933367093404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,128,balanced,0.0313226655125618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,128,power_law_1.01,0.03020159900188446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,128,power_law_1.01,0.030239999294281006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,128,power_law_1.2,0.029894399642944335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,128,power_law_1.2,0.030931198596954347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,16,balanced,0.03142400085926056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,16,balanced,0.03323733309904734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,16,power_law_1.01,0.03858560025691986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,16,power_law_1.01,0.040633600950241086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,16,power_law_1.2,0.03902080059051514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,16,power_law_1.2,0.03935999870300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,2,balanced,0.03359466542800268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,2,balanced,0.03435199956099192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,2,power_law_1.01,0.038380798697471616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,2,power_law_1.01,0.04035840034484863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,2,power_law_1.2,0.03873920142650604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,2,power_law_1.2,0.041766399145126344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,32,balanced,0.031210665901501972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,32,balanced,0.03189333279927572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,32,power_law_1.01,0.034380799531936644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,32,power_law_1.01,0.034841600060462954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,32,power_law_1.2,0.03454079926013946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,32,power_law_1.2,0.03496319949626923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,4,balanced,0.03345066557327906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,4,balanced,0.035402665535608925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,4,power_law_1.01,0.03886080086231232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,4,power_law_1.01,0.03894400000572205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,4,power_law_1.2,0.03866240084171295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,4,power_law_1.2,0.04030719995498657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,64,balanced,0.03162666658560435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,64,balanced,0.03170666595300039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,64,power_law_1.01,0.03160960078239441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,64,power_law_1.01,0.03244799971580505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,64,power_law_1.2,0.032927998900413515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,64,power_law_1.2,0.03320960104465485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,8,balanced,0.03143466760714849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,8,balanced,0.03161599983771642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,8,power_law_1.01,0.03885439932346344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,8,power_law_1.01,0.03961600065231323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,8,power_law_1.2,0.03933440148830414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,1,8,power_law_1.2,0.03980799913406372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,16,1,balanced,0.029461334149042766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,16,1,balanced,0.02959999938805898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,16,1,power_law_1.01,0.028505599498748778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,16,1,power_law_1.01,0.028838399052619933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,16,1,power_law_1.2,0.02876160144805908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,16,1,power_law_1.2,0.02885119915008545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,2,1,balanced,0.02941333254178365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,2,1,balanced,0.02959999938805898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,2,1,power_law_1.01,0.026815998554229736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,2,1,power_law_1.01,0.027065598964691163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,2,1,power_law_1.2,0.026918399333953857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,2,1,power_law_1.2,0.02710399925708771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,32,1,balanced,0.029338667790095013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,32,1,balanced,0.02943466603755951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,32,1,power_law_1.01,0.028518399596214293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,32,1,power_law_1.01,0.02858240008354187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,32,1,power_law_1.2,0.028012800216674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,32,1,power_law_1.2,0.02813439965248108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,4,1,balanced,0.02346133440732956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,4,1,balanced,0.023797333240509033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,4,1,power_law_1.01,0.022963200509548188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,4,1,power_law_1.01,0.023423999547958374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,4,1,power_law_1.2,0.022681599855422972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,4,1,power_law_1.2,0.022726400196552275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,8,1,balanced,0.031328000128269196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,8,1,balanced,0.03146133323510488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,8,1,power_law_1.01,0.029395198822021483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,8,1,power_law_1.01,0.030022400617599487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,8,1,power_law_1.2,0.029900801181793214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,2688,1856,6,128,8,1,power_law_1.2,0.02995840013027191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,1,balanced,0.04359466830889384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,1,balanced,0.057434668143590294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,1,power_law_1.01,0.041555199027061465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,1,power_law_1.01,0.04178560078144074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,1,power_law_1.2,0.0412992000579834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,1,power_law_1.2,0.04924159944057464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,128,balanced,0.03140799949566523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,128,balanced,0.03149333347876867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,128,power_law_1.01,0.029471999406814574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,128,power_law_1.01,0.030297601222991945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,128,power_law_1.2,0.030239999294281006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,128,power_law_1.2,0.030880001187324525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,16,balanced,0.031285333136717476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,16,balanced,0.03133333226044973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,16,power_law_1.01,0.046854400634765626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,16,power_law_1.01,0.048390400409698484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,16,power_law_1.2,0.04734080135822296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,16,power_law_1.2,0.04784640073776245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,2,balanced,0.037717332442601524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,2,balanced,0.04113066693147024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,2,power_law_1.01,0.04984959959983826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,2,power_law_1.01,0.061318397521972656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,2,power_law_1.2,0.0474368005990982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,2,power_law_1.2,0.047443199157714847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,256,balanced,0.02998399982849757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,256,balanced,0.03136533250411352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,256,power_law_1.01,0.02948479950428009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,256,power_law_1.01,0.02967039942741394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,256,power_law_1.2,0.029100799560546876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,256,power_law_1.2,0.029580798745155335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,32,balanced,0.031397332747777305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,32,balanced,0.031583999594052635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,32,power_law_1.01,0.047814399003982544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,32,power_law_1.01,0.04833920001983642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,32,power_law_1.2,0.04704639911651611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,32,power_law_1.2,0.048230400681495665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,4,balanced,0.031248000760873158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,4,balanced,0.03156266609827677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,4,power_law_1.01,0.047091200947761536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,4,power_law_1.01,0.04903680086135864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,4,power_law_1.2,0.04636160135269165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,4,power_law_1.2,0.04725759923458099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,64,balanced,0.030533333619435627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,64,balanced,0.031370667119820915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,64,power_law_1.01,0.033523198962211606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,64,power_law_1.01,0.034457600116729735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,64,power_law_1.2,0.034176000952720643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,64,power_law_1.2,0.03480960130691528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,8,balanced,0.03141333411137263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,8,balanced,0.03162133445342382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,8,power_law_1.01,0.04620159864425659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,8,power_law_1.01,0.047891199588775635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,8,power_law_1.2,0.04796159863471985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,1,8,power_law_1.2,0.048019200563430786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,16,1,balanced,0.02330133318901062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,16,1,balanced,0.023354666928450268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,16,1,power_law_1.01,0.022329600155353548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,16,1,power_law_1.01,0.022918400168418885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,16,1,power_law_1.2,0.0219200000166893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,16,1,power_law_1.2,0.02210559993982315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,2,1,balanced,0.031210665901501972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,2,1,balanced,0.03146133323510488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,2,1,power_law_1.01,0.031251201033592226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,2,1,power_law_1.01,0.036134400963783266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,2,1,power_law_1.2,0.028326401114463808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,2,1,power_law_1.2,0.028332799673080444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,32,1,balanced,0.023269332945346832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,32,1,balanced,0.02332266668478648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,32,1,power_law_1.01,0.021478399634361267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,32,1,power_law_1.01,0.022015999257564544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,32,1,power_law_1.2,0.021830399334430695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,32,1,power_law_1.2,0.02285439968109131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,4,1,balanced,0.02521066615978877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,4,1,balanced,0.02533866713444392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,4,1,power_law_1.01,0.023526400327682495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,4,1,power_law_1.01,0.02595199942588806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,4,1,power_law_1.2,0.02332800030708313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,4,1,power_law_1.2,0.024403199553489685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,8,1,balanced,0.023647998770078022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,8,1,balanced,0.025263999899228413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,8,1,power_law_1.01,0.023014399409294128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,8,1,power_law_1.01,0.023379200696945192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,8,1,power_law_1.2,0.02338559925556183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,3072,1536,8,256,8,1,power_law_1.2,0.023577600717544556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,1,balanced,0.10053867101669312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,1,balanced,0.1037066678206126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,1,power_law_1.01,0.09939200282096863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,1,power_law_1.01,0.10042239427566528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,1,power_law_1.2,0.10175360441207885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,1,power_law_1.2,0.10245120525360107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,2,balanced,0.09470400214195251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,2,balanced,0.09724799791971843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,2,power_law_1.01,0.09035519957542419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,2,power_law_1.01,0.09047679901123047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,2,power_law_1.2,0.09089279770851136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,2,power_law_1.2,0.11804159879684448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,4,balanced,0.09147733449935913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,4,balanced,0.10318400462468465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,4,power_law_1.01,0.08435840010643006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,4,power_law_1.01,0.08881279826164246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,4,power_law_1.2,0.08570880293846131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,4,power_law_1.2,0.10743039846420288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,8,balanced,0.08716266353925069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,8,balanced,0.09019733468691508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,8,power_law_1.01,0.08485119938850402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,8,power_law_1.01,0.08566399812698364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,8,power_law_1.2,0.08577280044555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,1,8,power_law_1.2,0.08684160113334656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,16,1,balanced,0.024010665714740753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,16,1,balanced,0.025290665527184803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,16,1,power_law_1.01,0.023660799860954283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,16,1,power_law_1.01,0.023999999463558196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,16,1,power_law_1.2,0.023904000222682954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,16,1,power_law_1.2,0.023974399268627166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,2,1,balanced,0.06673066814740498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,2,1,balanced,0.0722453345855077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,2,1,power_law_1.01,0.061504000425338747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,2,1,power_law_1.01,0.0716863989830017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,2,1,power_law_1.2,0.06751360297203064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,2,1,power_law_1.2,0.0680512011051178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,32,1,balanced,0.02497066557407379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,32,1,balanced,0.025392000873883564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,32,1,power_law_1.01,0.0225600004196167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,32,1,power_law_1.01,0.022598400712013245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,32,1,power_law_1.2,0.022944000363349915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,32,1,power_law_1.2,0.02336000055074692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,4,1,balanced,0.037647999823093414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,4,1,balanced,0.041034666200478874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,4,1,power_law_1.01,0.04067200124263763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,4,1,power_law_1.01,0.04090240001678467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,4,1,power_law_1.2,0.040550398826599124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,4,1,power_law_1.2,0.04185599982738495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,8,1,balanced,0.02934933453798294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,8,1,balanced,0.029482667644818623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,8,1,power_law_1.01,0.03139840066432953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,8,1,power_law_1.01,0.03266560137271881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,8,1,power_law_1.2,0.031974399089813234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,14336,2,8,8,1,power_law_1.2,0.03518719971179962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,1,balanced,0.0510506679614385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,1,balanced,0.051407997806866966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,1,power_law_1.01,0.04802559912204742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,1,power_law_1.01,0.048537600040435794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,1,power_law_1.2,0.05783680081367493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,1,power_law_1.2,0.058246397972106935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,128,balanced,0.033439998825391136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,128,power_law_1.01,0.03203839957714081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,128,power_law_1.01,0.032307198643684386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,128,power_law_1.2,0.031814399361610415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,128,power_law_1.2,0.031891199946403506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,16,balanced,0.031712000568707786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,16,balanced,0.033733333150545754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,16,power_law_1.01,0.05397120118141174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,16,power_law_1.01,0.05454720258712768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,16,power_law_1.2,0.0541375994682312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,16,power_law_1.2,0.05436800122261047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,2,balanced,0.03977599988381068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,2,balanced,0.043621331453323364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,2,power_law_1.01,0.053887999057769774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,2,power_law_1.01,0.05392640233039856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,2,power_law_1.2,0.055078399181365964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,2,power_law_1.2,0.057062399387359616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,32,balanced,0.03155199935038885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,32,balanced,0.03345600018898646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,32,power_law_1.01,0.038176000118255615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,32,power_law_1.01,0.03852159976959228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,32,power_law_1.2,0.038489601016044615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,32,power_law_1.2,0.03859840035438537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,4,balanced,0.03355200091997782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,4,balanced,0.0354666660229365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,4,power_law_1.01,0.054841601848602296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,4,power_law_1.01,0.05856639742851257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,4,power_law_1.2,0.05489280223846436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,4,power_law_1.2,0.05566080212593079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,64,balanced,0.032144000132878624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,64,balanced,0.0352906659245491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,64,power_law_1.01,0.033344000577926636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,64,power_law_1.01,0.0336896002292633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,64,power_law_1.2,0.032927998900413515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,64,power_law_1.2,0.03320319950580597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,8,balanced,0.03352533280849457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,8,balanced,0.033546666304270424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,8,power_law_1.01,0.05416960120201111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,8,power_law_1.01,0.05454720258712768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,8,power_law_1.2,0.053273600339889524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,1,8,power_law_1.2,0.05495679974555969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,16,1,balanced,0.02517866591612498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,16,1,balanced,0.025631998976071674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,16,1,power_law_1.01,0.024435199797153473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,16,1,power_law_1.01,0.02460159957408905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,16,1,power_law_1.2,0.023628799617290495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,16,1,power_law_1.2,0.02421119958162308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,2,1,balanced,0.033728001018365227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,2,1,balanced,0.035690667728583016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,2,1,power_law_1.01,0.03208320140838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,2,1,power_law_1.01,0.0322816014289856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,2,1,power_law_1.2,0.031999999284744264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,2,1,power_law_1.2,0.03391999900341034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,32,1,balanced,0.02510933329661687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,32,1,balanced,0.025402667621771496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,32,1,power_law_1.01,0.024083200097084045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,32,1,power_law_1.01,0.02423679977655411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,32,1,power_law_1.2,0.023756800591945647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,32,1,power_law_1.2,0.023788799345493317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,4,1,balanced,0.027434666951497395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,4,1,balanced,0.029093332588672638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,4,1,power_law_1.01,0.025702399015426636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,4,1,power_law_1.01,0.026240000128746034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,4,1,power_law_1.2,0.02597759962081909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,4,1,power_law_1.2,0.026182401180267333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,8,1,balanced,0.027221334477265675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,8,1,balanced,0.027295999228954315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,8,1,power_law_1.01,0.02526719868183136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,8,1,power_law_1.01,0.025407999753952026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,8,1,power_law_1.2,0.025465598702430724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,1536,8,128,8,1,power_law_1.2,0.025472000241279602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,1,balanced,0.14985066652297974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,1,balanced,0.15059199929237366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,1,power_law_1.01,0.14621440172195435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,1,power_law_1.01,0.14697599411010742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,1,power_law_1.2,0.14587520360946654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,1,power_law_1.2,0.14863359928131104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,128,balanced,0.037871999045213066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,128,balanced,0.03945599993069967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,128,power_law_1.01,0.05715199708938599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,128,power_law_1.01,0.059084802865982056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,128,power_law_1.2,0.05741440057754517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,128,power_law_1.2,0.057548797130584715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,16,balanced,0.04203199843565623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,16,balanced,0.042463997999827065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,16,power_law_1.01,0.1512063980102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,16,power_law_1.01,0.15171200037002563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,16,power_law_1.2,0.1524224042892456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,16,power_law_1.2,0.15253119468688964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,2,balanced,0.09498133261998494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,2,balanced,0.09616532921791077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,2,power_law_1.01,0.15204479694366455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,2,power_law_1.01,0.15263999700546266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,2,power_law_1.2,0.1513152003288269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,2,power_law_1.2,0.15271040201187133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,256,balanced,0.03774933268626531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,256,balanced,0.037920000652472176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,256,power_law_1.01,0.041126400232315063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,256,power_law_1.01,0.04132480025291443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,256,power_law_1.2,0.04103679955005646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,256,power_law_1.2,0.041715198755264284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,32,balanced,0.037765334049860634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,32,balanced,0.03787733366092046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,32,power_law_1.01,0.13165440559387206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,32,power_law_1.01,0.13177599906921386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,32,power_law_1.2,0.13070080280303956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,32,power_law_1.2,0.1318336009979248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,4,balanced,0.07041066884994507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,4,balanced,0.07101866602897644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,4,power_law_1.01,0.15229439735412598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,4,power_law_1.01,0.1527232050895691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,4,power_law_1.2,0.15259519815444947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,4,power_law_1.2,0.15304319858551024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,64,balanced,0.03562133262554804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,64,balanced,0.037471999724706016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,64,power_law_1.01,0.07650560140609741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,64,power_law_1.01,0.07749760150909424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,64,power_law_1.2,0.07672320008277893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,64,power_law_1.2,0.07690879702568054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,8,balanced,0.052015999952952065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,8,balanced,0.05418666700522105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,8,power_law_1.01,0.15425920486450195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,8,power_law_1.01,0.15551359653472902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,8,power_law_1.2,0.15260159969329834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,1,8,power_law_1.2,0.15415680408477783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,16,1,balanced,0.07654400169849396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,16,1,balanced,0.07990933458010356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,16,1,power_law_1.01,0.07409279942512512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,16,1,power_law_1.01,0.07420160174369812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,16,1,power_law_1.2,0.07356799840927124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,16,1,power_law_1.2,0.0743552029132843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,2,1,balanced,0.09773332873980205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,2,1,balanced,0.1002293328444163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,2,1,power_law_1.01,0.08862079977989197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,2,1,power_law_1.01,0.0893887996673584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,2,1,power_law_1.2,0.08872320055961609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,2,1,power_law_1.2,0.09159680008888245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,32,1,balanced,0.07044266661008199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,32,1,balanced,0.07060799996058147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,32,1,power_law_1.01,0.06841599941253662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,32,1,power_law_1.01,0.06844800114631652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,32,1,power_law_1.2,0.06859520077705383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,32,1,power_law_1.2,0.06872320175170898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,4,1,balanced,0.06797333558400472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,4,1,balanced,0.07032533486684163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,4,1,power_law_1.01,0.05958399772644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,4,1,power_law_1.01,0.059673601388931276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,4,1,power_law_1.2,0.058278399705886844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,4,1,power_law_1.2,0.06398079991340637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,8,1,balanced,0.041189332803090416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,8,1,balanced,0.05081599950790405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,8,1,power_law_1.01,0.03841919898986816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,8,1,power_law_1.01,0.040300801396369934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,8,1,power_law_1.2,0.038540801405906676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,4096,2688,22,512,8,1,power_law_1.2,0.0398144006729126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,1,balanced,0.1506239970525106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,1,balanced,0.15570666392644247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,1,power_law_1.01,0.15456000566482545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,1,power_law_1.01,0.1579200029373169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,1,power_law_1.2,0.14448000192642213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,1,power_law_1.2,0.1472383975982666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,2,balanced,0.11196266611417134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,2,balanced,0.12772799531618753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,2,power_law_1.01,0.12655359506607056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,2,power_law_1.01,0.15256960391998292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,2,power_law_1.2,0.1344383955001831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,2,power_law_1.2,0.14791040420532225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,4,balanced,0.12478400270144145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,4,balanced,0.13196266690889993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,4,power_law_1.01,0.10979199409484863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,4,power_law_1.01,0.12345600128173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,4,power_law_1.2,0.13363840579986572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,4,power_law_1.2,0.13432320356369018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,8,balanced,0.11162133018175761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,8,balanced,0.11377066373825073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,8,power_law_1.01,0.10924160480499268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,8,power_law_1.01,0.1129472017288208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,8,power_law_1.2,0.110316801071167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,1,8,power_law_1.2,0.11091840267181396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,16,1,balanced,0.03160000095764796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,16,1,balanced,0.032287999987602234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,16,1,power_law_1.01,0.03544319868087768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,16,1,power_law_1.01,0.03606399893760681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,16,1,power_law_1.2,0.029683199524879456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,16,1,power_law_1.2,0.0344895988702774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,2,1,balanced,0.0846666693687439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,2,1,balanced,0.09751466910044353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,2,1,power_law_1.01,0.08123520016670227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,2,1,power_law_1.01,0.0815999984741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,2,1,power_law_1.2,0.08008959889411926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,2,1,power_law_1.2,0.09759359955787658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,32,1,balanced,0.02935466667016347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,32,1,balanced,0.029359998802344005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,32,1,power_law_1.01,0.027859199047088622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,32,1,power_law_1.01,0.027987200021743774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,32,1,power_law_1.2,0.027193599939346315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,32,1,power_law_1.2,0.027935999631881713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,4,1,balanced,0.05904533465703329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,4,1,balanced,0.06838933130105336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,4,1,power_law_1.01,0.05397760272026062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,4,1,power_law_1.01,0.055871999263763426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,4,1,power_law_1.2,0.061952000856399535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,4,1,power_law_1.2,0.06682239770889283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,8,1,balanced,0.04111466556787491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,8,1,balanced,0.045312002301216125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,8,1,power_law_1.01,0.040575999021530154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,8,1,power_law_1.01,0.040863999724388124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,8,1,power_law_1.2,0.04074240028858185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,16384,2,8,8,1,power_law_1.2,0.04151679873466492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,1,balanced,0.07442133128643036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,1,balanced,0.08442133665084839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,1,power_law_1.01,0.07339519858360291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,1,power_law_1.01,0.0737600028514862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,1,power_law_1.2,0.07459200024604798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,1,power_law_1.2,0.07634559869766236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,128,balanced,0.03779733429352442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,128,balanced,0.03791466603676478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,128,power_law_1.01,0.04220159947872162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,128,power_law_1.01,0.0430976003408432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,128,power_law_1.2,0.04237439930438995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,128,power_law_1.2,0.04344319999217987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,16,balanced,0.03766933331886927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,16,balanced,0.03775999943415324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,16,power_law_1.01,0.07971839904785157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,16,power_law_1.01,0.08082559704780579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,16,power_law_1.2,0.07901440262794494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,16,power_law_1.2,0.08057600259780884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,2,balanced,0.06391466657320659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,2,balanced,0.06842666864395142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,2,power_law_1.01,0.07935360074043274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,2,power_law_1.01,0.08013439774513245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,2,power_law_1.2,0.0803264021873474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,2,power_law_1.2,0.08126720190048217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,256,balanced,0.03566399961709976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,256,balanced,0.037733333806196846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,256,power_law_1.01,0.03568640053272247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,256,power_law_1.01,0.03608959913253784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,256,power_law_1.2,0.03683840036392212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,256,power_law_1.2,0.03701759874820709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,32,balanced,0.0359946663180987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,32,balanced,0.0379573330283165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,32,power_law_1.01,0.07825279831886292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,32,power_law_1.01,0.07854080200195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,32,power_law_1.2,0.07768959999084472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,32,power_law_1.2,0.07994239926338195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,4,balanced,0.043765331308046974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,4,balanced,0.05188799897829691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,4,power_law_1.01,0.07904639840126038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,4,power_law_1.01,0.08156160116195679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,4,power_law_1.2,0.08097919821739197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,4,power_law_1.2,0.0840448021888733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,64,balanced,0.03770133356253306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,64,balanced,0.037802666425704956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,64,power_law_1.01,0.06255360245704651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,64,power_law_1.01,0.063673597574234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,64,power_law_1.2,0.0615231990814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,64,power_law_1.2,0.06340479850769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,8,balanced,0.037647999823093414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,8,balanced,0.03772799919048945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,8,power_law_1.01,0.07863039970397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,8,power_law_1.01,0.07873280048370361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,8,power_law_1.2,0.07777919769287109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,1,8,power_law_1.2,0.08000640273094177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,16,1,balanced,0.029472000896930695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,16,1,balanced,0.02962133288383484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,16,1,power_law_1.01,0.028441599011421202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,16,1,power_law_1.01,0.028799998760223388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,16,1,power_law_1.2,0.02839039862155914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,16,1,power_law_1.2,0.028454399108886717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,2,1,balanced,0.0537013312180837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,2,1,balanced,0.05410666763782501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,2,1,power_law_1.01,0.050892800092697144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,2,1,power_law_1.01,0.0531328022480011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,2,1,power_law_1.2,0.05052800178527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,2,1,power_law_1.2,0.05438079833984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,32,1,balanced,0.02918400118748347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,32,1,balanced,0.02959999938805898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,32,1,power_law_1.01,0.028678399324417115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,32,1,power_law_1.01,0.028998398780822755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,32,1,power_law_1.2,0.028217598795890808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,32,1,power_law_1.2,0.02842240035533905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,4,1,balanced,0.03974399964014689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,4,1,balanced,0.039749334255854286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,4,1,power_law_1.01,0.0321727991104126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,4,1,power_law_1.01,0.03625600039958954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,4,1,power_law_1.2,0.03133440017700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,4,1,power_law_1.2,0.03251200020313263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,8,1,balanced,0.03154666721820831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,8,1,balanced,0.03169599920511246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,8,1,power_law_1.01,0.029580798745155335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,8,1,power_law_1.01,0.029683199524879456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,8,1,power_law_1.2,0.02968960106372833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2048,8,256,8,1,power_law_1.2,0.02993920147418976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,1,balanced,0.08768000205357869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,1,balanced,0.08954667051633199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,1,power_law_1.01,0.0865664005279541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,1,power_law_1.01,0.08727040290832519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,1,power_law_1.2,0.08564479947090149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,1,power_law_1.2,0.0867904007434845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,16,balanced,0.03774933268626531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,16,balanced,0.03985599925120672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,16,power_law_1.01,0.09240319728851318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,16,power_law_1.01,0.09349120259284974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,16,power_law_1.2,0.09292160272598267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,16,power_law_1.2,0.09296640157699584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,2,balanced,0.06633066634337108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,2,balanced,0.06902933120727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,2,power_law_1.01,0.0949567973613739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,2,power_law_1.01,0.09610880017280579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,2,power_law_1.2,0.09049599766731262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,2,power_law_1.2,0.09105920195579528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,32,balanced,0.03777066618204117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,32,balanced,0.03966933240493139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,32,power_law_1.01,0.07209600210189819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,32,power_law_1.01,0.07269759774208069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,32,power_law_1.2,0.07154560089111328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,32,power_law_1.2,0.0723904013633728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,4,balanced,0.05197866757710775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,4,balanced,0.06248533229033152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,4,power_law_1.01,0.09151359796524047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,4,power_law_1.01,0.0923904001712799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,4,power_law_1.2,0.09028480052947999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,4,power_law_1.2,0.09394559860229493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,8,balanced,0.03950933367013931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,8,balanced,0.03961066653331121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,8,power_law_1.01,0.09164159893989562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,8,power_law_1.01,0.09225599765777588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,8,power_law_1.2,0.09155200123786926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,1,8,power_law_1.2,0.09200000166893005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,16,1,balanced,0.031504000226656594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,16,1,balanced,0.031530665854612984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,16,1,power_law_1.01,0.02971520125865936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,16,1,power_law_1.01,0.030060800909996032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,16,1,power_law_1.2,0.02930560111999512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,16,1,power_law_1.2,0.029817599058151244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,2,1,balanced,0.05962666869163513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,2,1,balanced,0.059903999169667564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,2,1,power_law_1.01,0.05743359923362732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,2,1,power_law_1.01,0.057843202352523805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,2,1,power_law_1.2,0.05772799849510193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,2,1,power_law_1.2,0.06002560257911682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,32,1,balanced,0.029311999678611755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,32,1,balanced,0.029648000995318096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,32,1,power_law_1.01,0.02861439883708954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,32,1,power_law_1.01,0.02911359965801239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,32,1,power_law_1.2,0.02815999984741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,32,1,power_law_1.2,0.029120001196861266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,4,1,balanced,0.04363200068473816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,4,1,balanced,0.04558933277924856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,4,1,power_law_1.01,0.04350079894065857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,4,1,power_law_1.01,0.04360319972038269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,4,1,power_law_1.2,0.04200960099697113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,4,1,power_law_1.2,0.04759680032730103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,8,1,balanced,0.031445334355036415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,8,1,balanced,0.03335466732581457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,8,1,power_law_1.01,0.03056640028953552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,8,1,power_law_1.01,0.031014400720596313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,8,1,power_law_1.2,0.03133440017700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,6144,2560,8,160,8,1,power_law_1.2,0.03134079873561859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,1,balanced,0.08463467160860698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,1,balanced,0.08564266562461853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,1,power_law_1.01,0.0811456024646759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,1,power_law_1.01,0.08419839739799499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,1,power_law_1.2,0.0818560004234314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,1,power_law_1.2,0.08618879914283753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,128,balanced,0.03998400022586187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,128,balanced,0.04176533222198486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,128,power_law_1.01,0.04717440009117126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,128,power_law_1.01,0.0480320006608963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,128,power_law_1.2,0.046700799465179445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,128,power_law_1.2,0.048614400625228885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,16,balanced,0.041519999504089355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,16,balanced,0.04186133543650309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,16,power_law_1.01,0.08810880184173583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,16,power_law_1.01,0.0881600022315979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,16,power_law_1.2,0.08850560188293458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,16,power_law_1.2,0.08901119828224183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,2,balanced,0.06651733318964641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,2,balanced,0.06869333485762279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,2,power_law_1.01,0.08728320002555848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,2,power_law_1.01,0.08802559971809387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,2,power_law_1.2,0.08643199801445008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,2,power_law_1.2,0.10245120525360107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,256,balanced,0.040031999349594116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,256,balanced,0.04174399872620901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,256,power_law_1.01,0.03964160084724426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,256,power_law_1.01,0.04004479944705963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,256,power_law_1.2,0.03891839981079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,256,power_law_1.2,0.03963519930839539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,32,balanced,0.03977066775163015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,32,balanced,0.04177600145339966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,32,power_law_1.01,0.08698239922523499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,32,power_law_1.01,0.0886080026626587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,32,power_law_1.2,0.08501120209693909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,32,power_law_1.2,0.08766720294952393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,4,balanced,0.061199997862180076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,4,balanced,0.06754666566848755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,4,power_law_1.01,0.08674560189247131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,4,power_law_1.01,0.08776320219039917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,4,power_law_1.2,0.08809599876403809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,4,power_law_1.2,0.08844159841537476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,64,balanced,0.04155199974775314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,64,balanced,0.04166933397452036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,64,power_law_1.01,0.06725119948387145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,64,power_law_1.01,0.06775680184364319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,64,power_law_1.2,0.06572800278663635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,64,power_law_1.2,0.06644480228424073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,8,balanced,0.04604800045490265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,8,balanced,0.05218133330345154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,8,power_law_1.01,0.08756480216979981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,8,power_law_1.01,0.10004479885101318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,8,power_law_1.2,0.08752639889717102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,1,8,power_law_1.2,0.08794879913330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,16,1,balanced,0.031957333286603294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,16,1,balanced,0.03339199970165888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,16,1,power_law_1.01,0.03043839931488037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,16,1,power_law_1.01,0.03080959916114807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,16,1,power_law_1.2,0.030048000812530517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,16,1,power_law_1.2,0.030713599920272828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,2,1,balanced,0.05818133552869161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,2,1,balanced,0.05919999877611796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,2,1,power_law_1.01,0.056441599130630495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,2,1,power_law_1.01,0.056467199325561525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,2,1,power_law_1.2,0.05736320018768311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,2,1,power_law_1.2,0.05790079832077026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,32,1,balanced,0.03149333347876867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,32,1,balanced,0.03158933420976003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,32,1,power_law_1.01,0.030105599761009218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,32,1,power_law_1.01,0.030316799879074097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,32,1,power_law_1.2,0.02968960106372833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,32,1,power_law_1.2,0.030015999078750612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,4,1,balanced,0.041536000867684685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,4,1,balanced,0.04549333453178406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,4,1,power_law_1.01,0.04136959910392761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,4,1,power_law_1.01,0.04346239864826203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,4,1,power_law_1.2,0.04002560079097748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,4,1,power_law_1.2,0.04630399942398071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,8,1,balanced,0.033530667424201965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,8,1,balanced,0.0355679988861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,8,1,power_law_1.01,0.031231999397277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,8,1,power_law_1.01,0.03203200101852417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,8,1,power_law_1.2,0.031615999341011045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,256,8,1,power_law_1.2,0.03190400004386902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,1,balanced,0.08251200119654338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,1,balanced,0.08286400139331818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,1,power_law_1.01,0.0806656002998352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,1,power_law_1.01,0.08305280208587647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,1,power_law_1.2,0.08283519744873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,1,power_law_1.2,0.08296319842338562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,128,balanced,0.03966933240493139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,128,balanced,0.04181866844495138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,128,power_law_1.01,0.05811840295791626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,128,power_law_1.01,0.058847999572753905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,128,power_law_1.2,0.058739197254180905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,128,power_law_1.2,0.05911039710044861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,16,balanced,0.04159999887148539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,16,balanced,0.04177066683769226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,16,power_law_1.01,0.08654720187187195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,16,power_law_1.01,0.08791040182113648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,16,power_law_1.2,0.08688639998435974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,16,power_law_1.2,0.08849920034408569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,2,balanced,0.06698133548100789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,2,balanced,0.06809600194295247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,2,power_law_1.01,0.08766720294952393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,2,power_law_1.01,0.08806399703025818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,2,power_law_1.2,0.08712319731712341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,2,power_law_1.2,0.0877888023853302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,32,balanced,0.04142933338880539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,32,balanced,0.042266666889190674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,32,power_law_1.01,0.08746880292892456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,32,power_law_1.01,0.08765439987182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,32,power_law_1.2,0.08768640160560608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,32,power_law_1.2,0.08815360069274902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,4,balanced,0.04976533353328705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,4,balanced,0.05413866539796194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,4,power_law_1.01,0.08722559809684753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,4,power_law_1.01,0.08818560242652893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,4,power_law_1.2,0.08721920251846313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,4,power_law_1.2,0.08792319893836975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,64,balanced,0.03979733337958654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,64,balanced,0.04167999823888143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,64,power_law_1.01,0.0751039981842041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,64,power_law_1.01,0.07560319900512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,64,power_law_1.2,0.07517439723014832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,64,power_law_1.2,0.07619839906692505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,8,balanced,0.041434665520985924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,8,balanced,0.04172799984614054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,8,power_law_1.01,0.0864575982093811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,8,power_law_1.01,0.0874176025390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,8,power_law_1.2,0.08731520175933838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,1,8,power_law_1.2,0.08861439824104309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,16,1,balanced,0.031194667021433514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,16,1,balanced,0.03154666721820831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,16,1,power_law_1.01,0.030630400776863097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,16,1,power_law_1.01,0.030982398986816408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,16,1,power_law_1.2,0.030105599761009218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,16,1,power_law_1.2,0.03020800054073334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,2,1,balanced,0.05860800047715505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,2,1,balanced,0.05876799921194712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,2,1,power_law_1.01,0.06577280163764954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,2,1,power_law_1.01,0.06711680293083191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,2,1,power_law_1.2,0.055820798873901366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,2,1,power_law_1.2,0.05690240263938904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,32,1,balanced,0.03143999973932902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,32,1,balanced,0.03213333338499069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,32,1,power_law_1.01,0.030630400776863097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,32,1,power_law_1.01,0.03086720108985901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,32,1,power_law_1.2,0.029875200986862183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,32,1,power_law_1.2,0.030995199084281923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,4,1,balanced,0.043568000197410583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,4,1,balanced,0.043605332573254905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,4,1,power_law_1.01,0.04392319917678833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,4,1,power_law_1.01,0.04636160135269165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,4,1,power_law_1.2,0.03587839901447296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,4,1,power_law_1.2,0.039750400185585025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,8,1,balanced,0.0335359995563825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,8,1,balanced,0.03357866654793421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,8,1,power_law_1.01,0.03244799971580505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,8,1,power_law_1.01,0.03445119857788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,8,1,power_law_1.2,0.03193599879741669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1,7168,2048,8,384,8,1,power_law_1.2,0.03219200074672699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,1,balanced,0.21663999557495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,1,balanced,0.21715199947357178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,1,power_law_1.01,0.2334144115447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,1,power_law_1.01,0.23379199504852294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,1,power_law_1.2,0.23720319271087648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,1,power_law_1.2,0.2374272108078003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,128,balanced,0.08780266841252644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,128,balanced,0.08904000123341878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,128,power_law_1.01,0.09101439714431762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,128,power_law_1.01,0.09244160056114196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,128,power_law_1.2,0.09219840168952942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,128,power_law_1.2,0.09249280095100403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,16,balanced,0.09921066959698994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,16,balanced,0.09999466935793559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,16,power_law_1.01,0.10419199466705323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,16,power_law_1.01,0.10533119440078735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,16,power_law_1.2,0.10606080293655396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,16,power_law_1.2,0.10607359409332276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,2,balanced,0.16266133387883505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,2,balanced,0.16346133748690286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,2,power_law_1.01,0.17427200078964233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,2,power_law_1.01,0.1751487970352173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,2,power_law_1.2,0.1766144037246704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,2,power_law_1.2,0.17706880569458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,32,balanced,0.09237333138783772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,32,balanced,0.09384000301361084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,32,power_law_1.01,0.09621760249137878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,32,power_law_1.01,0.09750400185585022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,32,power_law_1.2,0.09953280091285706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,32,power_law_1.2,0.09968000054359435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,4,balanced,0.12772267063458762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,4,balanced,0.13013333082199097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,4,power_law_1.01,0.13483519554138185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,4,power_law_1.01,0.1365056037902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,4,power_law_1.2,0.1374783992767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,4,power_law_1.2,0.13771519660949708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,64,balanced,0.09065066774686177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,64,balanced,0.09262933333714803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,64,power_law_1.01,0.09304959774017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,64,power_law_1.01,0.09441279768943786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,64,power_law_1.2,0.09625599980354309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,64,power_law_1.2,0.0969215989112854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,8,balanced,0.1107360025246938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,8,balanced,0.11134933431943257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,8,power_law_1.01,0.11559040546417236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,8,power_law_1.01,0.11705600023269654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,8,power_law_1.2,0.11908479928970336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,1,8,power_law_1.2,0.12012799978256225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,2,1,balanced,0.14990400274594626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,2,1,balanced,0.1506666640440623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,2,1,power_law_1.01,0.1643839955329895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,2,1,power_law_1.01,0.16535040140151977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,2,1,power_law_1.2,0.16662399768829345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,2,1,power_law_1.2,0.167193603515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,4,1,balanced,0.125109334786733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,4,1,balanced,0.1257866621017456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,4,1,power_law_1.01,0.13118720054626465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,4,1,power_law_1.01,0.13141119480133057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,4,1,power_law_1.2,0.13343360424041747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2048,768,8,128,4,1,power_law_1.2,0.13434239625930786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,1,balanced,0.47119466463724774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,1,balanced,0.4714133342107137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,1,power_law_1.01,0.49466238021850584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,1,power_law_1.01,0.49873919486999513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,1,power_law_1.2,0.5103744029998779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,1,power_law_1.2,0.5106880187988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,128,balanced,0.12361066540082295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,128,balanced,0.12404800454775493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,128,power_law_1.01,0.1252992033958435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,128,power_law_1.01,0.12575360536575317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,128,power_law_1.2,0.12742400169372559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,128,power_law_1.2,0.12920960187911987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,16,balanced,0.14478400349617004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,16,balanced,0.14577600359916687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,16,power_law_1.01,0.1521664023399353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,16,power_law_1.01,0.15229439735412598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,16,power_law_1.2,0.15715839862823486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,16,power_law_1.2,0.15772160291671752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,2,balanced,0.30979732672373456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,2,balanced,0.3100586732228597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,2,power_law_1.01,0.32359039783477783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,2,power_law_1.01,0.3248447895050049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,2,power_law_1.2,0.3244800090789795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,2,power_law_1.2,0.3355839967727661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,32,balanced,0.13171733419100443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,32,balanced,0.1318933367729187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,32,power_law_1.01,0.13408639430999755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,32,power_law_1.01,0.137881600856781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,32,power_law_1.2,0.14060159921646118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,32,power_law_1.2,0.1410752058029175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,4,balanced,0.22191466887791952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,4,balanced,0.22447466850280762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,4,power_law_1.01,0.23199999332427979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,4,power_law_1.01,0.23705599308013917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,4,power_law_1.2,0.237062406539917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,4,power_law_1.2,0.23903999328613282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,64,balanced,0.12591466307640076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,64,balanced,0.12607466181119284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,64,power_law_1.01,0.12993919849395752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,64,power_law_1.01,0.13019520044326782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,64,power_law_1.2,0.13107199668884278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,64,power_law_1.2,0.13400319814682007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,8,balanced,0.17342400550842285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,8,balanced,0.17466133832931519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,8,power_law_1.01,0.1801792025566101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,8,power_law_1.01,0.18305920362472533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,8,power_law_1.2,0.1835968017578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,1,8,power_law_1.2,0.1843008041381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,16,1,balanced,0.7916373411814371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,16,1,balanced,0.7925066947937012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,16,1,power_law_1.01,0.8568960189819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,16,1,power_law_1.01,0.8868864059448243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,16,1,power_law_1.2,0.9185983657836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,16,1,power_law_1.2,0.9271936416625977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,2,1,balanced,0.2916853427886963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,2,1,balanced,0.29267199834187824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,2,1,power_law_1.01,0.306822395324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,2,1,power_law_1.01,0.307859206199646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,2,1,power_law_1.2,0.3101248025894165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,2,1,power_law_1.2,0.311680006980896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,32,1,balanced,0.6823893388112386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,32,1,balanced,0.6833120187123617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,32,1,power_law_1.01,0.7577727794647217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,32,1,power_law_1.01,0.7616127967834473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,32,1,power_law_1.2,0.781331205368042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,32,1,power_law_1.2,0.7954048156738281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,4,1,balanced,0.19949867328008017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,4,1,balanced,0.20148267348607382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,4,1,power_law_1.01,0.20609281063079835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,4,1,power_law_1.01,0.20728960037231445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,4,1,power_law_1.2,0.21492478847503663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,4,1,power_law_1.2,0.21503360271453859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,8,1,balanced,1.0806667009989421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,8,1,balanced,1.1186506748199463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,8,1,power_law_1.01,1.166579246520996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,8,1,power_law_1.01,1.2101568222045898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,8,1,power_law_1.2,1.2485312461853026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,2688,1856,6,128,8,1,power_law_1.2,1.2529919624328614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,1,balanced,0.7970240116119385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,1,balanced,0.7989066441853842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,1,power_law_1.01,0.7793344020843506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,1,power_law_1.01,0.7810688018798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,1,power_law_1.2,0.8035584449768066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,1,power_law_1.2,0.8136256217956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,128,balanced,0.16461333632469177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,128,balanced,0.16546666622161865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,128,power_law_1.01,0.16757760047912598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,128,power_law_1.01,0.1678976058959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,128,power_law_1.2,0.16783360242843628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,128,power_law_1.2,0.16870399713516235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,16,balanced,0.21228800217310587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,16,balanced,0.21243733167648315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,16,power_law_1.01,0.2105407953262329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,16,power_law_1.01,0.21212799549102784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,16,power_law_1.2,0.21375999450683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,16,power_law_1.2,0.21794559955596923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,2,balanced,0.49905065695444745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,2,balanced,0.5008159875869751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,2,power_law_1.01,0.4910463809967041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,2,power_law_1.01,0.4919680118560791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,2,power_law_1.2,0.4997824192047119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,2,power_law_1.2,0.5142848014831543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,256,balanced,0.16446399688720703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,256,balanced,0.1646986703077952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,256,power_law_1.01,0.16391680240631104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,256,power_law_1.01,0.1642303943634033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,256,power_law_1.2,0.1646463990211487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,256,power_law_1.2,0.16614400148391723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,32,balanced,0.1848319967587789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,32,balanced,0.18483734130859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,32,power_law_1.01,0.18616960048675538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,32,power_law_1.01,0.1893183946609497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,32,power_law_1.2,0.19385600090026855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,32,power_law_1.2,0.19402240514755248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,4,balanced,0.34037331740061444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,4,balanced,0.3404906590779622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,4,power_law_1.01,0.3335488080978394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,4,power_law_1.01,0.3375103950500488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,4,power_law_1.2,0.3519423961639404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,4,power_law_1.2,0.35316479206085205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,64,balanced,0.17166932423909506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,64,balanced,0.17244799931844076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,64,power_law_1.01,0.17316479682922364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,64,power_law_1.01,0.17360639572143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,64,power_law_1.2,0.17377920150756837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,64,power_law_1.2,0.17638399600982665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,8,balanced,0.25524266560872394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,8,balanced,0.2553333242734273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,8,power_law_1.01,0.25528318881988527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,8,power_law_1.01,0.25632638931274415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,8,power_law_1.2,0.25975680351257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,1,8,power_law_1.2,0.26757121086120605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,16,1,balanced,0.20468799273173013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,16,1,balanced,0.20482667287190756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,16,1,power_law_1.01,0.20378239154815675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,16,1,power_law_1.01,0.20522239208221435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,16,1,power_law_1.2,0.2106175899505615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,16,1,power_law_1.2,0.211027193069458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,2,1,balanced,0.4769013325373332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,2,1,balanced,0.4769386847813924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,2,1,power_law_1.01,0.46141438484191893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,2,1,power_law_1.01,0.46474242210388184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,2,1,power_law_1.2,0.47675518989562987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,2,1,power_law_1.2,0.4810880184173584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,32,1,balanced,0.18273067474365234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,32,1,balanced,0.18338666359583536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,32,1,power_law_1.01,0.18259199857711791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,32,1,power_law_1.01,0.18414080142974854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,32,1,power_law_1.2,0.1863808035850525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,32,1,power_law_1.2,0.1889024019241333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,4,1,balanced,0.31676266590754193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,4,1,balanced,0.31910934050877887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,4,1,power_law_1.01,0.3110016107559204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,4,1,power_law_1.01,0.31239678859710696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,4,1,power_law_1.2,0.32242560386657715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,4,1,power_law_1.2,0.3228543996810913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,8,1,balanced,0.2441706657409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,8,1,balanced,0.24420799811681113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,8,1,power_law_1.01,0.24261119365692138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,8,1,power_law_1.01,0.24308478832244873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,8,1,power_law_1.2,0.24702720642089843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,3072,1536,8,256,8,1,power_law_1.2,0.2473855972290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,1,balanced,0.603983998298645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,1,balanced,0.6058080196380615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,1,power_law_1.01,0.7179264068603516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,1,power_law_1.01,0.7472064018249511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,1,power_law_1.2,0.7311808109283447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,1,power_law_1.2,0.7356031894683838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,2,balanced,0.35226666927337646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,2,balanced,0.3561600049336751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,2,power_law_1.01,0.49566078186035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,2,power_law_1.01,0.49598078727722167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,2,power_law_1.2,0.48755841255187987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,2,power_law_1.2,0.49025278091430663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,4,balanced,0.27983466784159344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,4,balanced,0.28169065713882446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,4,power_law_1.01,0.3418303966522217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,4,power_law_1.01,0.3542335987091064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,4,power_law_1.2,0.34946560859680176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,4,power_law_1.2,0.3816832065582275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,8,balanced,0.24830400943756104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,8,balanced,0.2498826583226522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,8,power_law_1.01,0.31429119110107423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,8,power_law_1.01,0.3173759937286377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,8,power_law_1.2,0.3177792072296143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,1,8,power_law_1.2,0.3288127899169922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,16,1,balanced,0.08062399923801422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,16,1,balanced,0.08108266691366832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,16,1,power_law_1.01,0.0883520007133484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,16,1,power_law_1.01,0.08862079977989197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,16,1,power_law_1.2,0.08833280205726624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,16,1,power_law_1.2,0.09086719751358033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,2,1,balanced,0.31732799609502155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,2,1,balanced,0.3183786670366923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,2,1,power_law_1.01,0.35831680297851565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,2,1,power_law_1.01,0.3699327945709229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,2,1,power_law_1.2,0.35596160888671874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,2,1,power_law_1.2,0.36789760589599607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,32,1,balanced,0.06832533578077953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,32,1,balanced,0.06842666864395142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,32,1,power_law_1.01,0.07279999852180481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,32,1,power_law_1.01,0.0729856014251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,32,1,power_law_1.2,0.07214080095291138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,32,1,power_law_1.2,0.07343360185623168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,4,1,balanced,0.1811359922091166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,4,1,balanced,0.1850879987080892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,4,1,power_law_1.01,0.19566719532012938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,4,1,power_law_1.01,0.20313599109649658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,4,1,power_law_1.2,0.19959039688110353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,4,1,power_law_1.2,0.20254080295562743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,8,1,balanced,0.11405332883199056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,8,1,balanced,0.11563733220100403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,8,1,power_law_1.01,0.12318079471588135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,8,1,power_law_1.01,0.12520960569381714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,8,1,power_law_1.2,0.12212480306625366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,14336,2,8,8,1,power_law_1.2,0.12451200485229492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,1,balanced,0.5792479912439982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,1,balanced,0.582261323928833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,1,power_law_1.01,0.6315904140472413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,1,power_law_1.01,0.6363135814666748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,1,power_law_1.2,0.6498303890228272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,1,power_law_1.2,0.6512256145477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,128,balanced,0.15014933546384177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,128,balanced,0.15134400129318237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,128,power_law_1.01,0.15413119792938232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,128,power_law_1.01,0.1568511962890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,128,power_law_1.2,0.1606783986091614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,128,power_law_1.2,0.16327680349349977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,16,balanced,0.18027200301488241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,16,balanced,0.18147200345993042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,16,power_law_1.01,0.19875199794769288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,16,power_law_1.01,0.1993407964706421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,16,power_law_1.2,0.1985535979270935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,16,power_law_1.2,0.20131840705871581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,2,balanced,0.3809973398844401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,2,balanced,0.3811733325322469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,2,power_law_1.01,0.41077117919921874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,2,power_law_1.01,0.4128704071044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,2,power_law_1.2,0.4282495975494385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,2,power_law_1.2,0.428326416015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,32,balanced,0.16126400232315063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,32,balanced,0.16158933440844217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,32,power_law_1.01,0.17203199863433838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,32,power_law_1.01,0.17316479682922364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,32,power_law_1.2,0.17926399707794188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,32,power_law_1.2,0.18154239654541016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,4,balanced,0.26900800069173175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,4,balanced,0.2697119911511739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,4,power_law_1.01,0.2867327928543091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,4,power_law_1.01,0.290067195892334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,4,power_law_1.2,0.29697279930114745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,4,power_law_1.2,0.3001728057861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,64,balanced,0.1541920006275177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,64,balanced,0.15435733397801718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,64,power_law_1.01,0.16154240369796752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,64,power_law_1.01,0.16264959573745727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,64,power_law_1.2,0.16624640226364135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,64,power_law_1.2,0.1687999963760376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,8,balanced,0.2122453252474467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,8,balanced,0.21251734097798666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,8,power_law_1.01,0.22641921043395996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,8,power_law_1.01,0.23386240005493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,8,power_law_1.2,0.23347198963165283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,1,8,power_law_1.2,0.23800320625305177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,16,1,balanced,0.1699999968210856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,16,1,balanced,0.17051732540130615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,16,1,power_law_1.01,0.19463679790496827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,16,1,power_law_1.01,0.19474560022354126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,16,1,power_law_1.2,0.1972864031791687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,16,1,power_law_1.2,0.19767040014266968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,2,1,balanced,0.36182932058970135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,2,1,balanced,0.3624853293100993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,2,1,power_law_1.01,0.3895359992980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,2,1,power_law_1.01,0.3915456056594849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,2,1,power_law_1.2,0.39572479724884035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,2,1,power_law_1.2,0.3974720001220703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,32,1,balanced,0.16268799702326456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,32,1,balanced,0.1629866659641266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,32,1,power_law_1.01,0.17316479682922364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,32,1,power_law_1.01,0.173580801486969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,32,1,power_law_1.2,0.1752575993537903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,32,1,power_law_1.2,0.17667839527130128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,4,1,balanced,0.2485226591428121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,4,1,balanced,0.2507733305295308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,4,1,power_law_1.01,0.27064321041107176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,4,1,power_law_1.01,0.27337601184844973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,4,1,power_law_1.2,0.2761087894439697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,4,1,power_law_1.2,0.2778815984725952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,8,1,balanced,0.20524799823760986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,8,1,balanced,0.2053333322207133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,8,1,power_law_1.01,0.21627519130706788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,8,1,power_law_1.01,0.2178431987762451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,8,1,power_law_1.2,0.21853439807891845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,1536,8,128,8,1,power_law_1.2,0.21867520809173585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,1,balanced,3.4981279373168945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,1,balanced,3.5648107528686523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,1,power_law_1.01,3.609939193725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,1,power_law_1.01,3.7195777893066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,1,power_law_1.2,3.8180286407470705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,1,power_law_1.2,3.9634239196777346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,128,balanced,0.5631999969482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,128,balanced,0.5646719932556152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,128,power_law_1.01,0.5785408020019531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,128,power_law_1.01,0.5791168212890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,128,power_law_1.2,0.5811327934265137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,128,power_law_1.2,0.5860352039337158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,16,balanced,0.7328159809112549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,16,balanced,0.7367839813232422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,16,power_law_1.01,0.7526591777801513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,16,power_law_1.01,0.7535103797912598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,16,power_law_1.2,0.7727168083190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,16,power_law_1.2,0.7785280227661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,2,balanced,2.0310400327046714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,2,balanced,2.06278403600057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,2,power_law_1.01,2.0813695907592775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,2,power_law_1.01,2.113030433654785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,2,power_law_1.2,2.1526655197143554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,2,power_law_1.2,2.184480094909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,256,balanced,0.553599993387858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,256,balanced,0.5562719901402792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,256,power_law_1.01,0.5617856025695801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,256,power_law_1.01,0.562713623046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,256,power_law_1.2,0.5650559902191162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,256,power_law_1.2,0.5702400207519531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,32,balanced,0.6392960151036581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,32,balanced,0.6434773206710815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,32,power_law_1.01,0.6602431774139405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,32,power_law_1.01,0.6619135856628418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,32,power_law_1.2,0.6719679832458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,32,power_law_1.2,0.6744319915771484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,4,balanced,1.2834453582763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,4,balanced,1.2873013019561768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,4,power_law_1.01,1.3180224418640136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,4,power_law_1.01,1.335647964477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,4,power_law_1.2,1.3405887603759765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,4,power_law_1.2,1.3890239715576171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,64,balanced,0.5931466817855835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,64,balanced,0.594373345375061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,64,power_law_1.01,0.6012991905212403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,64,power_law_1.01,0.6069375991821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,64,power_law_1.2,0.6092095851898194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,64,power_law_1.2,0.6157760143280029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,8,balanced,0.9240640004475912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,8,balanced,0.9269013404846191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,8,power_law_1.01,0.9416959762573243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,8,power_law_1.01,0.9436736106872559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,8,power_law_1.2,0.972332763671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,1,8,power_law_1.2,0.9807999610900879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,16,1,balanced,5.776917139689128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,16,1,balanced,6.171285629272461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,16,1,power_law_1.01,6.606719970703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,16,1,power_law_1.01,6.6196739196777346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,16,1,power_law_1.2,6.818764495849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,16,1,power_law_1.2,6.933010864257812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,2,1,balanced,1.8665013313293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,2,1,balanced,1.9760479927062988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,2,1,power_law_1.01,1.937887954711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,2,1,power_law_1.01,1.945542335510254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,2,1,power_law_1.2,1.9898880004882813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,2,1,power_law_1.2,2.0292224884033203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,32,1,balanced,4.029338518778483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,32,1,balanced,4.083392143249512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,32,1,power_law_1.01,4.427987289428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,32,1,power_law_1.01,4.454732894897461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,32,1,power_law_1.2,4.620512008666992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,32,1,power_law_1.2,4.637823867797851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,4,1,balanced,1.145840009053548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,4,1,balanced,1.148576021194458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,4,1,power_law_1.01,1.2041152000427247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,4,1,power_law_1.01,1.206668758392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,4,1,power_law_1.2,1.2262911796569824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,4,1,power_law_1.2,1.2294079780578613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,8,1,balanced,0.780239979426066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,8,1,balanced,0.7804533640543619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,8,1,power_law_1.01,0.8087936401367187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,8,1,power_law_1.01,0.8147968292236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,8,1,power_law_1.2,0.8366847991943359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,4096,2688,22,512,8,1,power_law_1.2,0.838316822052002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,1,balanced,0.9710240364074707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,1,balanced,0.9763840039571127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,1,power_law_1.01,1.2110976219177245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,1,power_law_1.01,1.2362367630004882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,1,power_law_1.2,1.1858559608459474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,1,power_law_1.2,1.2136256217956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,2,balanced,0.549786647160848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,2,balanced,0.5581333239873251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,2,power_law_1.01,0.6955008029937744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,2,power_law_1.01,0.7008255958557129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,2,power_law_1.2,0.6610367774963379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,2,power_law_1.2,0.7205503940582275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,4,balanced,0.3592160145441691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,4,balanced,0.360485315322876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,4,power_law_1.01,0.5139200210571289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,4,power_law_1.01,0.5167424201965332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,4,power_law_1.2,0.5138432025909424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,4,power_law_1.2,0.5792448043823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,8,balanced,0.30208534002304077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,8,balanced,0.30559466282526654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,8,power_law_1.01,0.41758079528808595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,8,power_law_1.01,0.4848320007324219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,8,power_law_1.2,0.4696191787719727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,1,8,power_law_1.2,0.49069437980651853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,16,1,balanced,0.10971200466156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,16,1,balanced,0.1106826663017273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,16,1,power_law_1.01,0.1329792022705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,16,1,power_law_1.01,0.13435519933700563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,16,1,power_law_1.2,0.13456640243530274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,16,1,power_law_1.2,0.1350208044052124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,2,1,balanced,0.4713120063145955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,2,1,balanced,0.4753439823786418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,2,1,power_law_1.01,0.5767807960510254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,2,1,power_law_1.01,0.5836607933044433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,2,1,power_law_1.2,0.595142412185669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,2,1,power_law_1.2,0.5975039958953857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,32,1,balanced,0.09480533003807068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,32,1,balanced,0.09481066465377808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,32,1,power_law_1.01,0.0986240029335022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,32,1,power_law_1.01,0.09893760085105896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,32,1,power_law_1.2,0.09779840111732482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,32,1,power_law_1.2,0.09965440034866332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,4,1,balanced,0.26610134045283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,4,1,balanced,0.26864532629648846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,4,1,power_law_1.01,0.3076927900314331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,4,1,power_law_1.01,0.3084415912628174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,4,1,power_law_1.2,0.3097471952438354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,4,1,power_law_1.2,0.3101311922073364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,8,1,balanced,0.16452800234158835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,8,1,balanced,0.16517333189646402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,8,1,power_law_1.01,0.1901247978210449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,8,1,power_law_1.01,0.19236479997634887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,8,1,power_law_1.2,0.19173760414123536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,16384,2,8,8,1,power_law_1.2,0.19186559915542603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,1,balanced,1.9197386105855305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,1,balanced,2.025813261667887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,1,power_law_1.01,1.8741056442260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,1,power_law_1.01,1.882918357849121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,1,power_law_1.2,1.9845439910888671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,1,power_law_1.2,1.9959295272827149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,128,balanced,0.2664639949798584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,128,balanced,0.266485333442688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,128,power_law_1.01,0.2719167947769165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,128,power_law_1.2,0.27654399871826174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,128,power_law_1.2,0.2795072078704834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,16,balanced,0.3665013313293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,16,balanced,0.3673066695531209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,16,power_law_1.01,0.3743743896484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,16,power_law_1.01,0.3762176036834717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,16,power_law_1.2,0.38391680717468263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,16,power_law_1.2,0.3890752077102661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,2,balanced,1.1100853284200032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,2,balanced,1.1131253242492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,2,power_law_1.01,1.0875776290893555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,2,power_law_1.01,1.0965120315551757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,2,power_law_1.2,1.1411904335021972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,2,power_law_1.2,1.1447232246398926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,256,balanced,0.26263999938964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,256,balanced,0.26294400294621784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,256,power_law_1.01,0.2639616012573242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,256,power_law_1.01,0.26465280055999757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,256,power_law_1.2,0.26776320934295655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,256,power_law_1.2,0.26829440593719484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,32,balanced,0.31165866057078045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,32,balanced,0.31222933530807495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,32,power_law_1.01,0.31674880981445314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,32,power_law_1.01,0.3190399885177612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,32,power_law_1.2,0.32473599910736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,32,power_law_1.2,0.32641921043395994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,4,balanced,0.6906826496124268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,4,balanced,0.6941333611806234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,4,power_law_1.01,0.6782336235046387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,4,power_law_1.01,0.6913663864135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,4,power_law_1.2,0.7099647998809815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,4,power_law_1.2,0.7135231971740723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,64,balanced,0.2789813280105591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,64,balanced,0.2790293296178182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,64,power_law_1.01,0.28481919765472413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,64,power_law_1.01,0.28543360233306886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,64,power_law_1.2,0.2928639888763428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,64,power_law_1.2,0.2947776079177856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,8,balanced,0.4763946533203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,8,balanced,0.4766666491826375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,8,power_law_1.01,0.47598719596862793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,8,power_law_1.01,0.48190717697143554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,8,power_law_1.2,0.5005055904388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,1,8,power_law_1.2,0.5062016010284424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,16,1,balanced,0.3678719997406006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,16,1,balanced,0.3681866725285848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,16,1,power_law_1.01,0.3670720100402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,16,1,power_law_1.01,0.3691391944885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,16,1,power_law_1.2,0.37883520126342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,16,1,power_law_1.2,0.38024320602416994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,2,1,balanced,1.0684266885121663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,2,1,balanced,1.0745279788970947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,2,1,power_law_1.01,1.0479616165161132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,2,1,power_law_1.01,1.0503487586975098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,2,1,power_law_1.2,1.0858752250671386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,2,1,power_law_1.2,1.091327953338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,32,1,balanced,0.3275946577390035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,32,1,balanced,0.32813866933186847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,32,1,power_law_1.01,0.3252608060836792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,32,1,power_law_1.01,0.3256959915161133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,32,1,power_law_1.2,0.33708159923553466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,32,1,power_law_1.2,0.33873279094696046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,4,1,balanced,0.6581386725107828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,4,1,balanced,0.6600213448206583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,4,1,power_law_1.01,0.6454080104827881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,4,1,power_law_1.01,0.6528704166412354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,4,1,power_law_1.2,0.6830016136169433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,4,1,power_law_1.2,0.6833792209625245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,8,1,balanced,0.4718720118204753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,8,1,balanced,0.47250131766001385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,8,1,power_law_1.01,0.463424015045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,8,1,power_law_1.01,0.46936960220336915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,8,1,power_law_1.2,0.4782144069671631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2048,8,256,8,1,power_law_1.2,0.478380823135376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,1,balanced,1.5904639561971028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,1,balanced,1.634709358215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,1,power_law_1.01,1.6439168930053711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,1,power_law_1.01,1.6481216430664063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,1,power_law_1.2,1.6914495468139648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,1,power_law_1.2,1.7075199127197265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,16,balanced,0.31995733578999835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,16,balanced,0.3222879966100057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,16,power_law_1.01,0.3482111930847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,16,power_law_1.01,0.35599360466003416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,16,power_law_1.2,0.35611519813537595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,16,power_law_1.2,0.35869441032409666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,2,balanced,0.9044319788614908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,2,balanced,0.9061013062795004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,2,power_law_1.01,0.9550271987915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,2,power_law_1.01,0.9706624031066895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,2,power_law_1.2,1.0019007682800294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,2,power_law_1.2,1.0147199630737305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,32,balanced,0.27356799443562824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,32,balanced,0.27400533358256024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,32,power_law_1.01,0.2931839942932129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,32,power_law_1.01,0.295743989944458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,32,power_law_1.2,0.30495998859405515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,32,power_law_1.2,0.30522880554199217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,4,balanced,0.5708426634470621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,4,balanced,0.5742666721343994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,4,power_law_1.01,0.6053952217102051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,4,power_law_1.01,0.6073728084564209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,4,power_law_1.2,0.6294335842132568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,4,power_law_1.2,0.6424831867218017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,8,balanced,0.40725334485371906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,8,balanced,0.407968004544576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,8,power_law_1.01,0.43148159980773926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,8,power_law_1.01,0.44387202262878417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,8,power_law_1.2,0.45242881774902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,1,8,power_law_1.2,0.45708160400390624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,16,1,balanced,0.3086293339729309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,16,1,balanced,0.3092533349990845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,16,1,power_law_1.01,0.32205440998077395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,16,1,power_law_1.01,0.32376320362091066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,16,1,power_law_1.2,0.3265023946762085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,16,1,power_law_1.2,0.3288831949234009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,2,1,balanced,0.8617386817932129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,2,1,balanced,0.8686827023824056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,2,1,power_law_1.01,0.922822380065918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,2,1,power_law_1.01,0.9347583770751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,2,1,power_law_1.2,0.9462528228759766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,2,1,power_law_1.2,0.9472576141357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,32,1,balanced,0.28065067529678345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,32,1,balanced,0.28123732407887775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,32,1,power_law_1.01,0.29410560131073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,32,1,power_law_1.01,0.29611520767211913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,32,1,power_law_1.2,0.3001024007797241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,32,1,power_law_1.2,0.3019520044326782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,4,1,balanced,0.5374186833699545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,4,1,balanced,0.5378559827804565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,4,1,power_law_1.01,0.5654143810272216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,4,1,power_law_1.01,0.5727935791015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,4,1,power_law_1.2,0.5816319942474365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,4,1,power_law_1.2,0.5830527782440186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,8,1,balanced,0.36948267618815106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,8,1,balanced,0.3712586561838786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,8,1,power_law_1.01,0.40741119384765623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,8,1,power_law_1.01,0.40953598022460935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,8,1,power_law_1.2,0.4135744094848633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,6144,2560,8,160,8,1,power_law_1.2,0.41390080451965333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,1,balanced,2.2212959925333657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,1,balanced,2.233674685160319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,1,power_law_1.01,2.1463296890258787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,1,power_law_1.01,2.2296703338623045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,1,power_law_1.2,2.288025665283203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,1,power_law_1.2,2.2927040100097655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,128,balanced,0.2918879985809326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,128,balanced,0.292741338411967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,128,power_law_1.01,0.2960383892059326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,128,power_law_1.01,0.29742720127105715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,128,power_law_1.2,0.30204799175262453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,128,power_law_1.2,0.30275840759277345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,16,balanced,0.4092693328857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,16,balanced,0.4100106557210286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,16,power_law_1.01,0.41948161125183103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,16,power_law_1.01,0.4218111991882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,16,power_law_1.2,0.41936001777648924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,16,power_law_1.2,0.4269440174102783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,2,balanced,1.2731093565622966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,2,balanced,1.3002346356709797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,2,power_law_1.01,1.2508735656738281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,2,power_law_1.01,1.2538111686706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,2,power_law_1.2,1.2742207527160645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,2,power_law_1.2,1.3063615798950194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,256,balanced,0.2860959966977437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,256,balanced,0.2861386736234029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,256,power_law_1.01,0.2881472110748291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,256,power_law_1.01,0.28890879154205323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,256,power_law_1.2,0.29513599872589114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,256,power_law_1.2,0.2977920055389404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,32,balanced,0.34169065952301025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,32,balanced,0.34278400739034015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,32,power_law_1.01,0.34292480945587156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,32,power_law_1.01,0.35415680408477784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,32,power_law_1.2,0.3555072069168091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,32,power_law_1.2,0.35934081077575686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,4,balanced,0.7859306335449219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,4,balanced,0.785973310470581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,4,power_law_1.01,0.7691391944885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,4,power_law_1.01,0.7739456176757813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,4,power_law_1.2,0.797657585144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,4,power_law_1.2,0.8079168319702148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,64,balanced,0.3028320074081421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,64,balanced,0.30567999680836994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,64,power_law_1.01,0.30963840484619143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,64,power_law_1.01,0.31132800579071046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,64,power_law_1.2,0.3219903945922852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,64,power_law_1.2,0.3265023946762085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,8,balanced,0.532367984453837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,8,balanced,0.5341279904047648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,8,power_law_1.01,0.527788782119751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,8,power_law_1.01,0.5405824184417725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,8,power_law_1.2,0.5564991950988769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,1,8,power_law_1.2,0.5605311870574952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,16,1,balanced,0.4207679828008016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,16,1,balanced,0.4209280014038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,16,1,power_law_1.01,0.418668794631958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,16,1,power_law_1.01,0.4247488021850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,16,1,power_law_1.2,0.43317761421203616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,16,1,power_law_1.2,0.43495678901672363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,2,1,balanced,1.2357866764068604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,2,1,balanced,1.2502079804738362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,2,1,power_law_1.01,1.1990464210510254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,2,1,power_law_1.01,1.2199423789978028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,2,1,power_law_1.2,1.254297637939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,2,1,power_law_1.2,1.2653759956359862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,32,1,balanced,0.37481598059336346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,32,1,balanced,0.3755093415578206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,32,1,power_law_1.01,0.3745343923568726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,32,1,power_law_1.01,0.377836799621582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,32,1,power_law_1.2,0.38496639728546145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,32,1,power_law_1.2,0.3870464086532593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,4,1,balanced,0.7570559978485107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,4,1,balanced,0.7595787048339844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,4,1,power_law_1.01,0.7489408016204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,4,1,power_law_1.01,0.7490816116333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,4,1,power_law_1.2,0.7860544204711915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,4,1,power_law_1.2,0.7899519920349121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,8,1,balanced,0.540229320526123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,8,1,balanced,0.540880004564921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,8,1,power_law_1.01,0.535539197921753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,8,1,power_law_1.01,0.5356607913970948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,8,1,power_law_1.2,0.5466559886932373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,256,8,1,power_law_1.2,0.5502655982971192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,1,balanced,3.485136032104492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,1,balanced,3.566495895385742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,1,power_law_1.01,3.001491165161133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,1,power_law_1.01,3.094508743286133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,1,power_law_1.2,3.0592063903808593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,1,power_law_1.2,3.2487808227539063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,128,balanced,0.3545120159784953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,128,balanced,0.3546239932378133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,128,power_law_1.01,0.35612800121307375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,128,power_law_1.01,0.3591936111450195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,128,power_law_1.2,0.3587519884109497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,128,power_law_1.2,0.3608191967010498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,16,balanced,0.5252639849980673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,16,balanced,0.527509331703186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,16,power_law_1.01,0.5179200172424316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,16,power_law_1.01,0.5214655876159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,16,power_law_1.2,0.5188864231109619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,16,power_law_1.2,0.5237247943878174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,2,balanced,1.8167626063028972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,2,balanced,1.8194506963094075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,2,power_law_1.01,1.6646463394165039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,2,power_law_1.01,1.6946304321289063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,2,power_law_1.2,1.7017152786254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,2,power_law_1.2,1.7256767272949218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,32,balanced,0.43271998564402264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,32,balanced,0.4331093231836955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,32,power_law_1.01,0.4251584053039551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,32,power_law_1.01,0.4286464214324951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,32,power_law_1.2,0.43415040969848634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,32,power_law_1.2,0.4394752025604248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,4,balanced,1.0831092993418376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,4,balanced,1.0852426687876384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,4,power_law_1.01,0.9729280471801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,4,power_law_1.01,1.0211775779724122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,4,power_law_1.2,1.017523193359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,4,power_law_1.2,1.0211520195007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,64,balanced,0.37932801246643066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,64,balanced,0.3796373208363851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,64,power_law_1.01,0.38008320331573486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,64,power_law_1.01,0.38103039264678956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,64,power_law_1.2,0.3852927923202515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,64,power_law_1.2,0.3879296064376831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,8,balanced,0.7184267044067383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,8,balanced,0.7190879980723063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,8,power_law_1.01,0.6695744037628174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,8,power_law_1.01,0.6934591770172119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,8,power_law_1.2,0.6980480194091797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,1,8,power_law_1.2,0.7033408164978028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,16,1,balanced,0.5860586563746134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,16,1,balanced,0.5873119831085205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,16,1,power_law_1.01,0.5470848083496094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,16,1,power_law_1.01,0.5493696212768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,16,1,power_law_1.2,0.5561279773712158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,16,1,power_law_1.2,0.5568448066711426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,2,1,balanced,1.842842737833659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,2,1,balanced,1.8647839228312175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,2,1,power_law_1.01,1.5975104331970216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,2,1,power_law_1.01,1.6082368850708009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,2,1,power_law_1.2,1.6485376358032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,2,1,power_law_1.2,1.6608383178710937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,32,1,balanced,0.5283840099970499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,32,1,balanced,0.5284106731414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,32,1,power_law_1.01,0.494982385635376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,32,1,power_law_1.01,0.4967872142791748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,32,1,power_law_1.2,0.5077375888824462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,32,1,power_law_1.2,0.5081791877746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,4,1,balanced,1.0933866500854492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,4,1,balanced,1.0947360197703044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,4,1,power_law_1.01,0.9834367752075195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,4,1,power_law_1.01,0.9897472381591796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,4,1,power_law_1.2,1.0082048416137694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,4,1,power_law_1.2,1.0175359725952149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,8,1,balanced,0.7603413263956705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,8,1,balanced,0.7614080111185709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,8,1,power_law_1.01,0.6826687812805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,8,1,power_law_1.01,0.6902783870697021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,8,1,power_law_1.2,0.6948991775512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1024,7168,2048,8,384,8,1,power_law_1.2,0.6996287822723388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,1,balanced,1.1516319910685222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,1,balanced,1.1561013062795003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,1,power_law_1.01,1.2167296409606934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,1,power_law_1.01,1.2230591773986816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,1,power_law_1.2,1.2358336448669434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,1,power_law_1.2,1.2375295639038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,128,balanced,0.6777546405792236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,128,balanced,0.6781706809997559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,128,power_law_1.01,0.7116159915924072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,128,power_law_1.01,0.7134463787078857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,128,power_law_1.2,0.7427328109741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,128,power_law_1.2,0.7435776233673096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,16,balanced,0.7096800009409586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,16,balanced,0.7098346551259359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,16,power_law_1.01,0.7675903797149658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,16,power_law_1.01,0.7676479816436768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,16,power_law_1.2,0.7699391841888428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,16,power_law_1.2,0.7765567779541016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,2,balanced,0.962773323059082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,2,balanced,0.9681493441263834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,2,power_law_1.01,1.01592960357666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,2,power_law_1.01,1.029702377319336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,2,power_law_1.2,1.05283203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,2,power_law_1.2,1.0650943756103515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,32,balanced,0.6926080385843912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,32,balanced,0.6944213708241781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,32,power_law_1.01,0.7190847873687745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,32,power_law_1.01,0.7585536003112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,32,power_law_1.2,0.7623424053192138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,32,power_law_1.2,0.7693632125854493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,4,balanced,0.8144266605377197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,4,balanced,0.8259946505228678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,4,power_law_1.01,0.8785920143127441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,4,power_law_1.01,0.8834815979003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,4,power_law_1.2,0.893939208984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,4,power_law_1.2,0.9198016166687012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,64,balanced,0.6826186974843343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,64,balanced,0.6829973061879476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,64,power_law_1.01,0.7145599842071533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,64,power_law_1.01,0.7228288173675537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,64,power_law_1.2,0.7583871841430664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,64,power_law_1.2,0.765996789932251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,8,balanced,0.745247999827067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,8,balanced,0.7480959892272949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,8,power_law_1.01,0.8005184173583985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,8,power_law_1.01,0.8038335800170898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,8,power_law_1.2,0.8302592277526856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,1,8,power_law_1.2,0.8449407577514648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,2,1,balanced,0.8193653424580892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,2,1,balanced,0.821125348409017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,2,1,power_law_1.01,0.8703295707702636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,2,1,power_law_1.01,0.8713343620300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,2,1,power_law_1.2,0.8783743858337403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,2,1,power_law_1.2,0.8792575836181641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,4,1,balanced,0.6860106786092123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,4,1,balanced,0.6921813488006592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,4,1,power_law_1.01,0.729472017288208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,4,1,power_law_1.01,0.733900785446167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,4,1,power_law_1.2,0.7352447986602784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2048,768,8,128,4,1,power_law_1.2,0.7386303901672363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,1,balanced,2.0636693636576333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,1,balanced,2.1076265970865884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,1,power_law_1.01,2.1230016708374024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,1,power_law_1.01,2.157721519470215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,1,power_law_1.2,2.167526435852051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,1,power_law_1.2,2.172652816772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,128,balanced,0.8708799680074056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,128,balanced,0.8713119824727377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,128,power_law_1.01,0.9433535575866699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,128,power_law_1.01,0.948038387298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,128,power_law_1.2,1.0252351760864258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,128,power_law_1.2,1.0462207794189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,16,balanced,0.9478027025858561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,16,balanced,0.9511040051778158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,16,power_law_1.01,1.0394432067871093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,16,power_law_1.01,1.0492351531982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,16,power_law_1.2,1.0639616012573243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,16,power_law_1.2,1.0823552131652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,2,balanced,1.527685324350993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,2,balanced,1.5322880744934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,2,power_law_1.01,1.6391807556152345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,2,power_law_1.01,1.6628736495971679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,2,power_law_1.2,1.6462976455688476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,2,power_law_1.2,1.6777856826782227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,32,balanced,0.9034773508707682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,32,balanced,0.903557300567627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,32,power_law_1.01,0.98538236618042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,32,power_law_1.01,1.0018752098083497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,32,power_law_1.2,1.032262420654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,32,power_law_1.2,1.0401535987854005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,4,balanced,1.197424014409383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,4,balanced,1.2047839959462483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,4,power_law_1.01,1.2787455558776855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,4,power_law_1.01,1.2988800048828124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,4,power_law_1.2,1.3582528114318848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,4,power_law_1.2,1.375712013244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,64,balanced,0.8833119869232178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,64,balanced,0.8859466711680094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,64,power_law_1.01,0.9618623733520508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,64,power_law_1.01,0.9668352127075195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,64,power_law_1.2,1.0187904357910156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,64,power_law_1.2,1.0487808227539062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,8,balanced,1.0308319727579753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,8,balanced,1.0342880090077717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,8,power_law_1.01,1.104691219329834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,8,power_law_1.01,1.1614015579223633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,8,power_law_1.2,1.152064037322998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,1,8,power_law_1.2,1.1559679985046387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,16,1,balanced,3.7792800267537436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,16,1,balanced,3.785717328389486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,16,1,power_law_1.01,3.7793216705322266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,16,1,power_law_1.01,3.7849472045898436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,16,1,power_law_1.2,3.8165119171142576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,16,1,power_law_1.2,3.8268287658691404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,2,1,balanced,1.3384426434834797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,2,1,balanced,1.3418773015340169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,2,1,power_law_1.01,1.3732864379882812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,2,1,power_law_1.01,1.3794048309326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,2,1,power_law_1.2,1.3892288208007812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,2,1,power_law_1.2,1.390944004058838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,32,1,balanced,3.3033278783162436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,32,1,balanced,3.3212105433146157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,32,1,power_law_1.01,3.400678253173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,32,1,power_law_1.01,3.4073471069335937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,32,1,power_law_1.2,3.415903854370117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,32,1,power_law_1.2,3.423244857788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,4,1,balanced,0.9705173174540201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,4,1,balanced,0.9720693429311117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,4,1,power_law_1.01,0.9929535865783692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,4,1,power_law_1.01,0.9985983848571778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,4,1,power_law_1.2,1.0053312301635742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,4,1,power_law_1.2,1.0089216232299805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,8,1,balanced,4.92193063100179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,8,1,balanced,4.954863866170247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,8,1,power_law_1.01,4.885913467407226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,8,1,power_law_1.01,5.14521598815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,8,1,power_law_1.2,5.159449768066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,2688,1856,6,128,8,1,power_law_1.2,5.160800170898438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,1,balanced,2.5808266003926597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,1,balanced,2.6408960024515786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,1,power_law_1.01,2.7404800415039063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,1,power_law_1.01,2.7666431427001954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,1,power_law_1.2,2.7977344512939455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,1,power_law_1.2,2.8216831207275392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,128,balanced,1.0226506392161052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,128,balanced,1.0241599877675374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,128,power_law_1.01,1.074732780456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,128,power_law_1.01,1.0940671920776368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,128,power_law_1.2,1.1250368118286134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,128,power_law_1.2,1.1418560028076172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,16,balanced,1.1152373154958088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,16,balanced,1.1204906304677327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,16,power_law_1.01,1.2157312393188477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,16,power_law_1.01,1.222707176208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,16,power_law_1.2,1.2684224128723145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,16,power_law_1.2,1.2796480178833007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,2,balanced,1.8238666852315266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,2,balanced,1.8255306879679363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,2,power_law_1.01,2.0220672607421877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,2,power_law_1.01,2.0501632690429688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,2,power_law_1.2,2.0688575744628905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,2,power_law_1.2,2.132671928405762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,256,balanced,1.015349308649699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,256,balanced,1.0170613129933674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,256,power_law_1.01,1.0629055976867676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,256,power_law_1.01,1.0654911994934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,256,power_law_1.2,1.1078783988952636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,256,power_law_1.2,1.1130559921264649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,32,balanced,1.0640746752421062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,32,balanced,1.0647520224253337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,32,power_law_1.01,1.1408767700195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,32,power_law_1.01,1.1540863990783692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,32,power_law_1.2,1.178649616241455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,32,power_law_1.2,1.1829055786132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,4,balanced,1.4215893745422363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,4,balanced,1.4273120562235515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,4,power_law_1.01,1.5838720321655273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,4,power_law_1.01,1.5894847869873048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,4,power_law_1.2,1.6042112350463866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,4,power_law_1.2,1.6190336227416993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,64,balanced,1.0372533003489177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,64,balanced,1.0375040372212727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,64,power_law_1.01,1.1043456077575684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,64,power_law_1.01,1.1050368309020997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,64,power_law_1.2,1.1378303527832032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,64,power_law_1.2,1.1644415855407715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,8,balanced,1.2184373537699382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,8,balanced,1.2258773644765217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,8,power_law_1.01,1.3031999588012695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,8,power_law_1.01,1.3187007904052734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,8,power_law_1.2,1.3996159553527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,1,8,power_law_1.2,1.4131391525268555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,16,1,balanced,0.8627466360727946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,16,1,balanced,0.8646079699198405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,16,1,power_law_1.01,0.924563217163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,16,1,power_law_1.01,0.9286975860595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,16,1,power_law_1.2,0.933465576171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,16,1,power_law_1.2,0.9381759643554688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,2,1,balanced,1.613024075826009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,2,1,balanced,1.6163733800252278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,2,1,power_law_1.01,1.7604352951049804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,2,1,power_law_1.01,1.7684480667114257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,2,1,power_law_1.2,1.7953151702880858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,2,1,power_law_1.2,1.7977216720581055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,32,1,balanced,0.8095520337422689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,32,1,balanced,0.8105920155843099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,32,1,power_law_1.01,0.8691007614135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,32,1,power_law_1.01,0.8696127891540527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,32,1,power_law_1.2,0.8770496368408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,32,1,power_law_1.2,0.880281639099121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,4,1,balanced,1.1455199718475342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,4,1,balanced,1.1495947043100994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,4,1,power_law_1.01,1.2424768447875976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,4,1,power_law_1.01,1.249612808227539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,4,1,power_law_1.2,1.262598419189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,4,1,power_law_1.2,1.2673343658447265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,8,1,balanced,0.9614293575286865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,8,1,balanced,0.9624533653259277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,8,1,power_law_1.01,1.0313728332519532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,8,1,power_law_1.01,1.0349568367004394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,8,1,power_law_1.2,1.044825553894043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,3072,1536,8,256,8,1,power_law_1.2,1.0502016067504882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,1,balanced,5.759093602498372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,1,balanced,5.784058888753255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,1,power_law_1.01,5.715711975097657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,1,power_law_1.01,5.785305786132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,1,power_law_1.2,5.741670227050781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,1,power_law_1.2,5.82677116394043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,2,balanced,3.4867626825968423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,2,balanced,3.5313758850097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,2,power_law_1.01,4.171417617797852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,2,power_law_1.01,4.173235321044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,2,power_law_1.2,3.9088382720947266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,2,power_law_1.2,3.972582244873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,4,balanced,2.4464213053385415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,4,balanced,2.4689013163248696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,4,power_law_1.01,3.4788158416748045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,4,power_law_1.01,4.187366485595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,4,power_law_1.2,3.3934398651123048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,4,power_law_1.2,4.106079864501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,8,balanced,1.9649759928385417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,8,balanced,1.9665120442708333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,8,power_law_1.01,3.48089599609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,8,power_law_1.01,3.484089660644531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,8,power_law_1.2,3.4240257263183596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,1,8,power_law_1.2,3.563955307006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,16,1,balanced,0.5584213336308798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,16,1,balanced,0.5591520071029663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,16,1,power_law_1.01,0.5690688133239746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,16,1,power_law_1.01,0.5773248195648193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,16,1,power_law_1.2,0.570911979675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,16,1,power_law_1.2,0.5711232185363769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,2,1,balanced,2.847797393798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,2,1,balanced,2.873994509379069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,2,1,power_law_1.01,2.7627775192260744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,2,1,power_law_1.01,2.8401023864746096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,2,1,power_law_1.2,2.7780351638793945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,2,1,power_law_1.2,2.805471992492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,32,1,balanced,0.4303893248240153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,32,1,balanced,0.43699200948079425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,32,1,power_law_1.01,0.43962879180908204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,32,1,power_law_1.01,0.4434944152832031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,32,1,power_law_1.2,0.44280319213867186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,32,1,power_law_1.2,0.4453567981719971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,4,1,balanced,1.4457813898722331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,4,1,balanced,1.486021359761556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,4,1,power_law_1.01,1.451155185699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,4,1,power_law_1.01,1.4701184272766112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,4,1,power_law_1.2,1.4447360038757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,4,1,power_law_1.2,1.4737279891967774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,8,1,balanced,0.834000031153361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,8,1,balanced,0.8398773670196533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,8,1,power_law_1.01,0.8495039939880371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,8,1,power_law_1.01,0.8691904067993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,8,1,power_law_1.2,0.8573887825012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,14336,2,8,8,1,power_law_1.2,0.866374397277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,1,balanced,2.990629196166992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,1,balanced,3.086602528889974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,1,power_law_1.01,3.137830352783203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,1,power_law_1.01,3.149318313598633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,1,power_law_1.2,3.1109312057495115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,1,power_law_1.2,3.1129087448120116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,128,balanced,1.1420213381449382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,128,balanced,1.144208033879598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,128,power_law_1.01,1.2563136100769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,128,power_law_1.01,1.2736127853393555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,128,power_law_1.2,1.3428863525390624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,128,power_law_1.2,1.3568063735961915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,16,balanced,1.2505706946055095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,16,balanced,1.2547679742177327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,16,power_law_1.01,1.3842687606811523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,16,power_law_1.01,1.4247679710388184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,16,power_law_1.2,1.4737152099609374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,16,power_law_1.2,1.537440013885498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,2,balanced,2.128544012705485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,2,balanced,2.129093329111735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,2,power_law_1.01,2.314675140380859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,2,power_law_1.01,2.3533248901367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,2,power_law_1.2,2.3900224685668947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,2,power_law_1.2,2.4112319946289062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,32,balanced,1.1886773109436035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,32,balanced,1.1933813095092773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,32,power_law_1.01,1.3302528381347656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,32,power_law_1.01,1.362451171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,32,power_law_1.2,1.4178815841674806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,32,power_law_1.2,1.4272768020629882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,4,balanced,1.6267733573913574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,4,balanced,1.6276960372924805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,4,power_law_1.01,1.7769279479980469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,4,power_law_1.01,1.8137792587280273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,4,power_law_1.2,1.8257152557373046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,4,power_law_1.2,1.837331199645996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,64,balanced,1.1555786927541096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,64,balanced,1.1589706738789876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,64,power_law_1.01,1.296236801147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,64,power_law_1.01,1.3367487907409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,64,power_law_1.2,1.3437888145446777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,64,power_law_1.2,1.3772735595703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,8,balanced,1.3681333859761555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,8,balanced,1.3710986773173015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,8,power_law_1.01,1.560531234741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,8,power_law_1.01,1.5648511886596679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,8,power_law_1.2,1.540454387664795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,1,8,power_law_1.2,1.6610431671142578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,16,1,balanced,1.049829324086507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,16,1,balanced,1.0513599713643391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,16,1,power_law_1.01,1.0927935600280763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,16,1,power_law_1.01,1.099827194213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,16,1,power_law_1.2,1.0998527526855468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,16,1,power_law_1.2,1.109113597869873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,2,1,balanced,1.898954709370931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,2,1,balanced,1.9049173990885417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,2,1,power_law_1.01,2.008070373535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,2,1,power_law_1.01,2.0084352493286133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,2,1,power_law_1.2,2.0289791107177733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,2,1,power_law_1.2,2.042163276672363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,32,1,balanced,0.9892373085021973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,32,1,balanced,0.9902293682098389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,32,1,power_law_1.01,1.0339520454406739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,32,1,power_law_1.01,1.0359295845031737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,32,1,power_law_1.2,1.0425663948059083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,32,1,power_law_1.2,1.042636775970459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,4,1,balanced,1.3674079577128093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,4,1,balanced,1.3730613390604656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,4,1,power_law_1.01,1.4446975708007812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,4,1,power_law_1.01,1.4551551818847657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,4,1,power_law_1.2,1.451360034942627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,4,1,power_law_1.2,1.454700756072998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,8,1,balanced,1.1615359783172607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,8,1,balanced,1.1655253569285076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,8,1,power_law_1.01,1.2161855697631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,8,1,power_law_1.01,1.2182592391967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,8,1,power_law_1.2,1.2226495742797852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,1536,8,128,8,1,power_law_1.2,1.2305536270141602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,1,balanced,16.120426177978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,1,balanced,16.287957509358723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,1,power_law_1.01,15.669708251953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,1,power_law_1.01,15.679200744628906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,1,power_law_1.2,15.860557556152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,1,power_law_1.2,15.951795959472657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,128,balanced,4.137200037638347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,128,balanced,4.145610809326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,128,power_law_1.01,4.344678497314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,128,power_law_1.01,4.3585662841796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,128,power_law_1.2,4.468953704833984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,128,power_law_1.2,4.501939010620117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,16,balanced,4.744592030843099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,16,balanced,4.765568097432454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,16,power_law_1.01,5.006521606445313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,16,power_law_1.01,5.090124893188476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,16,power_law_1.2,5.121734237670898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,16,power_law_1.2,5.218259048461914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,2,balanced,10.054170608520508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,2,balanced,10.073504130045572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,2,power_law_1.01,9.94361572265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,2,power_law_1.01,9.945721435546876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,2,power_law_1.2,10.001331329345703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,2,power_law_1.2,10.460601806640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,256,balanced,4.090538660685222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,256,balanced,4.095466613769531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,256,power_law_1.01,4.248057556152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,256,power_law_1.01,4.264128112792969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,256,power_law_1.2,4.378976058959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,256,power_law_1.2,4.460838317871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,32,balanced,4.392538706461589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,32,balanced,4.419120152791341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,32,power_law_1.01,4.630150222778321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,32,power_law_1.01,4.666937637329101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,32,power_law_1.2,4.930239868164063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,32,power_law_1.2,4.946656036376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,4,balanced,6.762613296508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,4,balanced,6.786373138427734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,4,power_law_1.01,6.866751861572266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,4,power_law_1.01,7.068115234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,4,power_law_1.2,7.346092987060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,4,power_law_1.2,7.539084625244141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,64,balanced,4.2249759038289385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,64,balanced,4.228831926981608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,64,power_law_1.01,4.449299240112305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,64,power_law_1.01,4.468102264404297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,64,power_law_1.2,4.63702392578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,64,power_law_1.2,4.661766433715821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,8,balanced,5.478906631469727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,8,balanced,5.492501576741536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,8,power_law_1.01,5.628979110717774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,8,power_law_1.01,5.802783966064453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,8,power_law_1.2,5.855424118041992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,1,8,power_law_1.2,5.9656318664550785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,16,1,balanced,27.140912373860676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,16,1,balanced,27.749867757161457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,16,1,power_law_1.01,27.06696472167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,16,1,power_law_1.01,27.33463134765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,16,1,power_law_1.2,27.46251525878906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,16,1,power_law_1.2,27.845343017578124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,2,1,balanced,9.196320215861002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,2,1,balanced,9.247557322184244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,2,1,power_law_1.01,8.791129302978515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,2,1,power_law_1.01,9.148076629638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,2,1,power_law_1.2,8.883833312988282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,2,1,power_law_1.2,9.153740692138673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,32,1,balanced,19.88593037923177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,32,1,balanced,19.951727549235027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,32,1,power_law_1.01,18.97900848388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,32,1,power_law_1.01,19.00765380859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,32,1,power_law_1.2,19.174342346191406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,32,1,power_law_1.2,19.24493408203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,4,1,balanced,5.650773366292317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,4,1,balanced,5.872688293457031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,4,1,power_law_1.01,5.540531158447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,4,1,power_law_1.01,5.562112045288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,4,1,power_law_1.2,5.559936141967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,4,1,power_law_1.2,5.611411285400391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,8,1,balanced,4.152213414510091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,8,1,balanced,4.165578524271647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,8,1,power_law_1.01,4.000780868530273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,8,1,power_law_1.01,4.03966064453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,8,1,power_law_1.2,4.051302337646485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,4096,2688,22,512,8,1,power_law_1.2,4.083840179443359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,1,balanced,9.177679697672525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,1,balanced,9.31438954671224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,1,power_law_1.01,9.324416351318359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,1,power_law_1.01,9.460435485839843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,1,power_law_1.2,9.2093505859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,1,power_law_1.2,9.522297668457032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,2,balanced,5.26749324798584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,2,balanced,5.315600077311198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,2,power_law_1.01,6.86145248413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,2,power_law_1.01,6.978854370117188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,2,power_law_1.2,7.031833648681641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,2,power_law_1.2,7.274240112304687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,4,balanced,3.3159891764322915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,4,balanced,3.3646027247111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,4,power_law_1.01,5.397030258178711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,4,power_law_1.01,5.7605632781982425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,4,power_law_1.2,5.273440170288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,4,power_law_1.2,6.009408187866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,8,balanced,2.515941301981608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,8,balanced,2.5262346267700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,8,power_law_1.01,4.527328109741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,8,power_law_1.01,4.995264053344727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,8,power_law_1.2,4.659404754638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,1,8,power_law_1.2,5.111558532714843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,16,1,balanced,0.8357439835866293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,16,1,balanced,0.8402933279673258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,16,1,power_law_1.01,0.8453248023986817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,16,1,power_law_1.01,0.8508607864379882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,16,1,power_law_1.2,0.8453887939453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,16,1,power_law_1.2,0.8485247611999511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,2,1,balanced,4.502581278483073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,2,1,balanced,4.568319956461589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,2,1,power_law_1.01,4.415200042724609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,2,1,power_law_1.01,4.526943969726562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,2,1,power_law_1.2,4.429395294189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,2,1,power_law_1.2,4.52105598449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,32,1,balanced,0.6193439960479736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,32,1,balanced,0.6270933151245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,32,1,power_law_1.01,0.6335296154022216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,32,1,power_law_1.01,0.6412032127380372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,32,1,power_law_1.2,0.6306111812591553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,32,1,power_law_1.2,0.6336383819580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,4,1,balanced,2.352229277292887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,4,1,balanced,2.459712028503418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,4,1,power_law_1.01,2.3027456283569334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,4,1,power_law_1.01,2.346502494812012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,4,1,power_law_1.2,2.300262451171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,4,1,power_law_1.2,2.370732879638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,8,1,balanced,1.2884533405303955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,8,1,balanced,1.3128373622894287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,8,1,power_law_1.01,1.3125375747680663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,8,1,power_law_1.01,1.3267200469970704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,8,1,power_law_1.2,1.31593599319458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,16384,2,8,8,1,power_law_1.2,1.325836753845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,1,balanced,5.851770401000977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,1,balanced,6.162197113037109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,1,power_law_1.01,6.651058959960937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,1,power_law_1.01,6.741862487792969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,1,power_law_1.2,6.833529663085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,1,power_law_1.2,6.876332855224609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,128,balanced,1.635482629140218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,128,balanced,1.6386292775472004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,128,power_law_1.01,1.771878433227539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,128,power_law_1.01,1.776019287109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,128,power_law_1.2,1.889241600036621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,128,power_law_1.2,1.8951423645019532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,16,balanced,1.8647573788960774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,16,balanced,1.8690773646036785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,16,power_law_1.01,2.0951295852661134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,16,power_law_1.01,2.0986303329467773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,16,power_law_1.2,2.239366340637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,16,power_law_1.2,2.2711551666259764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,2,balanced,3.6905972162882485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,2,balanced,3.7279841105143228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,2,power_law_1.01,4.277753448486328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,2,power_law_1.01,4.280467224121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,2,power_law_1.2,4.362374496459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,2,power_law_1.2,4.453785705566406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,256,balanced,1.6194240252176921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,256,balanced,1.6195786794026692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,256,power_law_1.01,1.7364864349365234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,256,power_law_1.01,1.7380352020263672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,256,power_law_1.2,1.8585535049438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,256,power_law_1.2,1.8911296844482421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,32,balanced,1.7302667299906414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,32,balanced,1.7341972986857097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,32,power_law_1.01,1.925766372680664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,32,power_law_1.01,1.9508159637451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,32,power_law_1.2,2.0693248748779296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,32,power_law_1.2,2.112211227416992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,4,balanced,2.6683521270751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,4,balanced,2.6877225240071616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,4,power_law_1.01,3.0521984100341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,4,power_law_1.01,3.0552383422851563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,4,power_law_1.2,3.1029247283935546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,4,power_law_1.2,3.153753662109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,64,balanced,1.6670026779174805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,64,balanced,1.6749866803487141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,64,power_law_1.01,1.8200576782226563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,64,power_law_1.01,1.8216768264770509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,64,power_law_1.2,1.9563264846801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,64,power_law_1.2,1.9688064575195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,8,balanced,2.113386631011963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,8,balanced,2.136826674143473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,8,power_law_1.01,2.4418943405151365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,8,power_law_1.01,2.468729591369629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,8,power_law_1.2,2.5449920654296876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,1,8,power_law_1.2,2.5788991928100584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,16,1,balanced,1.5321760177612305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,16,1,balanced,1.5331625938415527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,16,1,power_law_1.01,1.6339967727661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,16,1,power_law_1.01,1.6357568740844726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,16,1,power_law_1.2,1.6485055923461913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,16,1,power_law_1.2,1.6504575729370117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,2,1,balanced,3.4453760782877603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,2,1,balanced,3.4918880462646484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,2,1,power_law_1.01,3.7488128662109377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,2,1,power_law_1.01,3.8072063446044924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,2,1,power_law_1.2,3.747129440307617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,2,1,power_law_1.2,3.787583923339844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,32,1,balanced,1.4164907137552898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,32,1,balanced,1.4184106190999348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,32,1,power_law_1.01,1.5180224418640136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,32,1,power_law_1.01,1.5187071800231933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,32,1,power_law_1.2,1.529971218109131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,32,1,power_law_1.2,1.5347071647644044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,4,1,balanced,2.2511679331461587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,4,1,balanced,2.264906724294027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,4,1,power_law_1.01,2.475347137451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,4,1,power_law_1.01,2.479827117919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,4,1,power_law_1.2,2.479974365234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,4,1,power_law_1.2,2.4962303161621096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,8,1,balanced,1.7750132878621419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,8,1,balanced,1.7812587420145671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,8,1,power_law_1.01,1.8956607818603515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,8,1,power_law_1.01,1.8957248687744142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,8,1,power_law_1.2,1.921625518798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2048,8,256,8,1,power_law_1.2,1.9301504135131835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,1,balanced,7.105338414510091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,1,balanced,7.121695836385091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,1,power_law_1.01,7.424658966064453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,1,power_law_1.01,7.478444671630859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,1,power_law_1.2,7.246771240234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,1,power_law_1.2,7.290035247802734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,16,balanced,2.023530642191569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,16,balanced,2.02839994430542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,16,power_law_1.01,2.3442495346069334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,16,power_law_1.01,2.3657087326049804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,16,power_law_1.2,2.5703935623168945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,16,power_law_1.2,2.6390335083007814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,2,balanced,4.240864117940267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,2,balanced,4.283034642537435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,2,power_law_1.01,4.6789695739746096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,2,power_law_1.01,4.965139389038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,2,power_law_1.2,5.003231811523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,2,power_law_1.2,5.029164886474609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,32,balanced,1.8665067354838054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,32,balanced,1.8676533699035645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,32,power_law_1.01,2.197279930114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,32,power_law_1.01,2.2064128875732423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,32,power_law_1.2,2.3511871337890624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,32,power_law_1.2,2.448134422302246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,4,balanced,2.9831040700276694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,4,balanced,2.9878880182902017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,4,power_law_1.01,3.2919551849365236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,4,power_law_1.01,3.3499454498291015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,4,power_law_1.2,3.379129409790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,4,power_law_1.2,3.384844970703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,8,balanced,2.3374560674031577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,8,balanced,2.338714599609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,8,power_law_1.01,2.7237119674682617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,8,power_law_1.01,2.835699272155762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,8,power_law_1.2,2.811801528930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,1,8,power_law_1.2,2.9776063919067384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,16,1,balanced,1.6708319981892903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,16,1,balanced,1.6712160110473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,16,1,power_law_1.01,1.724928092956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,16,1,power_law_1.01,1.7299776077270508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,16,1,power_law_1.2,1.732262420654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,16,1,power_law_1.2,1.7373184204101562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,2,1,balanced,3.925365447998047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,2,1,balanced,3.967834790547689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,2,1,power_law_1.01,4.037484741210937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,2,1,power_law_1.01,4.053753662109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,2,1,power_law_1.2,4.086758422851562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,2,1,power_law_1.2,4.110655975341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,32,1,balanced,1.5125279426574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,32,1,balanced,1.5175946553548176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,32,1,power_law_1.01,1.5662976264953614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,32,1,power_law_1.01,1.571571159362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,32,1,power_law_1.2,1.5809151649475097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,32,1,power_law_1.2,1.5876735687255858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,4,1,balanced,2.541744073232015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,4,1,balanced,2.5477919578552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,4,1,power_law_1.01,2.6493568420410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,4,1,power_law_1.01,2.6555456161499023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,4,1,power_law_1.2,2.658758354187012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,4,1,power_law_1.2,2.666841506958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,8,1,balanced,1.8993439674377441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,8,1,balanced,1.9002985954284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,8,1,power_law_1.01,1.9839040756225585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,8,1,power_law_1.01,1.9917568206787108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,8,1,power_law_1.2,1.9958911895751954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,6144,2560,8,160,8,1,power_law_1.2,1.9963775634765626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,1,balanced,6.712469100952148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,1,balanced,6.789632161458333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,1,power_law_1.01,7.523366546630859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,1,power_law_1.01,7.829357147216797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,1,power_law_1.2,7.9137214660644535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,1,power_law_1.2,7.92639389038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,128,balanced,1.7930773099263508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,128,balanced,1.7994240125020344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,128,power_law_1.01,1.951545524597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,128,power_law_1.01,1.9539775848388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,128,power_law_1.2,2.1069055557250977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,128,power_law_1.2,2.1267839431762696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,16,balanced,2.0662026405334473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,16,balanced,2.06768528620402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,16,power_law_1.01,2.334943962097168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,16,power_law_1.01,2.3412160873413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,16,power_law_1.2,2.432352066040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,16,power_law_1.2,2.496735954284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,2,balanced,4.407290776570638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,2,balanced,4.468021392822266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,2,power_law_1.01,4.807494354248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,2,power_law_1.01,4.815110397338867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,2,power_law_1.2,5.1001537322998045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,2,power_law_1.2,5.221478271484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,256,balanced,1.777359962463379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,256,balanced,1.7789546648661296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,256,power_law_1.01,1.9073663711547852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,256,power_law_1.01,1.9379520416259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,256,power_law_1.2,2.0781375885009767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,256,power_law_1.2,2.113702392578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,32,balanced,1.9059947331746419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,32,balanced,1.9101707140604656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,32,power_law_1.01,2.1067903518676756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,32,power_law_1.01,2.1230783462524414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,32,power_law_1.2,2.2755775451660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,32,power_law_1.2,2.297382354736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,4,balanced,3.0110559463500977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,4,balanced,3.0180320739746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,4,power_law_1.01,3.395123291015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,4,power_law_1.01,3.487596893310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,4,power_law_1.2,3.6449535369873045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,4,power_law_1.2,3.8230079650878905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,64,balanced,1.8279147148132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,64,balanced,1.837546666463216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,64,power_law_1.01,2.0243904113769533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,64,power_law_1.01,2.0328575134277345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,64,power_law_1.2,2.182137680053711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,64,power_law_1.2,2.2573375701904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,8,balanced,2.37665065129598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,8,balanced,2.37827205657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,8,power_law_1.01,2.707724761962891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,8,power_law_1.01,2.760076713562012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,8,power_law_1.2,2.8082815170288087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,1,8,power_law_1.2,2.9679487228393553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,16,1,balanced,1.7450879414876301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,16,1,balanced,1.7505173683166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,16,1,power_law_1.01,1.8685823440551759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,16,1,power_law_1.01,1.8716863632202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,16,1,power_law_1.2,1.8815999984741212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,16,1,power_law_1.2,1.883795166015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,2,1,balanced,3.920111974080404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,2,1,balanced,3.955882708231608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,2,1,power_law_1.01,4.279148864746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,2,1,power_law_1.01,4.36426887512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,2,1,power_law_1.2,4.3263294219970705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,2,1,power_law_1.2,4.371443176269532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,32,1,balanced,1.612661361694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,32,1,balanced,1.6141494115193684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,32,1,power_law_1.01,1.7350719451904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,32,1,power_law_1.01,1.7408128738403321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,32,1,power_law_1.2,1.748627281188965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,32,1,power_law_1.2,1.7539007186889648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,4,1,balanced,2.561178684234619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,4,1,balanced,2.59006404876709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,4,1,power_law_1.01,2.828044891357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,4,1,power_law_1.01,2.86362247467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,4,1,power_law_1.2,2.855129623413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,4,1,power_law_1.2,2.8792064666748045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,8,1,balanced,2.035871982574463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,8,1,balanced,2.036640008290609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,8,1,power_law_1.01,2.1785215377807616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,8,1,power_law_1.01,2.182099151611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,8,1,power_law_1.2,2.1984960556030275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,256,8,1,power_law_1.2,2.2035072326660154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,1,balanced,7.552256266276042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,1,balanced,7.6014455159505205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,1,power_law_1.01,8.626445007324218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,1,power_law_1.01,8.767231750488282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,1,power_law_1.2,8.953632354736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,1,power_law_1.2,9.003794860839843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,128,balanced,1.8517279624938965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,128,balanced,1.8543626467386882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,128,power_law_1.01,1.9858816146850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,128,power_law_1.01,2.0276607513427733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,128,power_law_1.2,2.0718591690063475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,128,power_law_1.2,2.086272048950195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,16,balanced,2.136133352915446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,16,balanced,2.1425280570983887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,16,power_law_1.01,2.3618751525878907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,16,power_law_1.01,2.3974336624145507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,16,power_law_1.2,2.5308416366577147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,16,power_law_1.2,2.5458751678466798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,2,balanced,4.5734453201293945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,2,balanced,4.591231981913249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,2,power_law_1.01,5.218342590332031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,2,power_law_1.01,5.3089344024658205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,2,power_law_1.2,5.481919860839843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,2,power_law_1.2,5.574009704589844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,32,balanced,1.972991943359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,32,balanced,1.9739947319030762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,32,power_law_1.01,2.1777280807495116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,32,power_law_1.01,2.2407936096191405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,32,power_law_1.2,2.306150436401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,32,power_law_1.2,2.3478527069091797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,4,balanced,3.108304023742676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,4,balanced,3.1203254063924155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,4,power_law_1.01,3.5439998626708986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,4,power_law_1.01,3.6236095428466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,4,power_law_1.2,3.6848831176757812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,4,power_law_1.2,3.8148094177246095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,64,balanced,1.892682711283366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,64,balanced,1.8950079282124836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,64,power_law_1.01,2.0378623962402345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,64,power_law_1.01,2.0603328704833985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,64,power_law_1.2,2.1236352920532227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,64,power_law_1.2,2.1523839950561525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,8,balanced,2.4725653330485025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,8,balanced,2.474208037058512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,8,power_law_1.01,2.7673343658447265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,8,power_law_1.01,2.787833595275879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,8,power_law_1.2,2.9363967895507814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,1,8,power_law_1.2,2.9507904052734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,16,1,balanced,1.817263921101888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,16,1,balanced,1.8180267016092937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,16,1,power_law_1.01,1.9723840713500977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,16,1,power_law_1.01,1.9836160659790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,16,1,power_law_1.2,2.026361656188965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,16,1,power_law_1.2,2.0336063385009764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,2,1,balanced,4.120640118916829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,2,1,balanced,4.361557324727376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,2,1,power_law_1.01,4.692812728881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,2,1,power_law_1.01,4.845657730102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,2,1,power_law_1.2,4.833760070800781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,2,1,power_law_1.2,4.984819030761718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,32,1,balanced,1.6745386123657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,32,1,balanced,1.6764267285664876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,32,1,power_law_1.01,1.833203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,32,1,power_law_1.01,1.833670425415039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,32,1,power_law_1.2,1.8658432006835937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,32,1,power_law_1.2,1.8678335189819335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,4,1,balanced,2.703653335571289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,4,1,balanced,2.7312161127726235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,4,1,power_law_1.01,3.068339157104492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,4,1,power_law_1.01,3.0839231491088865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,4,1,power_law_1.2,3.146816062927246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,4,1,power_law_1.2,3.1501951217651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,8,1,balanced,2.1254080136617026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,8,1,balanced,2.1267360051472983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,8,1,power_law_1.01,2.336031913757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,8,1,power_law_1.01,2.3368192672729493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,8,1,power_law_1.2,2.3874496459960937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,12288,7168,2048,8,384,8,1,power_law_1.2,2.3888383865356446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,1,balanced,0.1481706698735555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,1,balanced,0.14825066924095154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,1,power_law_1.01,0.14120960235595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,1,power_law_1.01,0.1415488004684448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,1,power_law_1.2,0.1417088031768799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,1,power_law_1.2,0.14320000410079955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,128,balanced,0.04479999840259552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,128,balanced,0.04573333263397217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,128,power_law_1.01,0.0434112012386322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,128,power_law_1.01,0.043609601259231565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,128,power_law_1.2,0.04337919950485229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,128,power_law_1.2,0.043673598766326906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,16,balanced,0.04615999758243561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,16,balanced,0.04618666569391886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,16,power_law_1.01,0.04525440037250519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,16,power_law_1.01,0.04555520117282867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,16,power_law_1.2,0.045433598756790164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,16,power_law_1.2,0.046137601137161255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,2,balanced,0.09679999947547913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,2,balanced,0.09702400366465251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,2,power_law_1.01,0.09354239702224731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,2,power_law_1.01,0.09455360174179077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,2,power_law_1.2,0.09435520172119141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,2,power_law_1.2,0.09489920139312744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,32,balanced,0.04490133126576742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,32,balanced,0.04593066871166229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,32,power_law_1.01,0.04425599873065948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,32,power_law_1.01,0.044460800290107724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,32,power_law_1.2,0.04472320079803467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,32,power_law_1.2,0.044819200038909913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,4,balanced,0.07246933380762736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,4,balanced,0.07258133093516032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,4,power_law_1.01,0.06921600103378296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,4,power_law_1.01,0.06958720088005066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,4,power_law_1.2,0.06952959895133973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,4,power_law_1.2,0.070278400182724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,64,balanced,0.04561600089073181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,64,balanced,0.04577066500981649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,64,power_law_1.01,0.043635201454162595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,64,power_law_1.01,0.043968001008033754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,64,power_law_1.2,0.044012799859046936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,64,power_law_1.2,0.044121599197387694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,8,balanced,0.050245334704717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,8,balanced,0.05162666738033295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,8,power_law_1.01,0.048307201266288756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,8,power_law_1.01,0.049542400240898135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,8,power_law_1.2,0.050291198492050174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,1,8,power_law_1.2,0.05075200200080872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,2,1,balanced,0.09850133458773296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,2,1,balanced,0.09897599617640178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,2,1,power_law_1.01,0.09313920140266418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,2,1,power_law_1.01,0.09430400133132935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,2,1,power_law_1.2,0.09540479779243469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,2,1,power_law_1.2,0.09557759761810303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,4,1,balanced,0.07454933226108551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,4,1,balanced,0.07483733197053273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,4,1,power_law_1.01,0.07184000015258789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,4,1,power_law_1.01,0.07249919772148132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,4,1,power_law_1.2,0.07216640114784241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2048,768,8,128,4,1,power_law_1.2,0.07268480062484742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,1,balanced,0.35517334938049316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,1,balanced,0.35656531651814777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,1,power_law_1.01,0.320249605178833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,1,power_law_1.01,0.3218816041946411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,1,power_law_1.2,0.3241280078887939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,1,power_law_1.2,0.3331072092056274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,128,balanced,0.060234665870666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,128,balanced,0.062208001812299095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,128,power_law_1.01,0.059059202671051025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,128,power_law_1.01,0.05980160236358643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,128,power_law_1.2,0.059308797121047974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,128,power_law_1.2,0.0593280017375946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,16,balanced,0.07277333239714305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,16,balanced,0.07306666672229767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,16,power_law_1.01,0.06897280216217042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,16,power_law_1.01,0.07071999907493591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,16,power_law_1.2,0.07004160284996033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,16,power_law_1.2,0.07087360024452209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,2,balanced,0.21316266059875488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,2,balanced,0.2169439991315206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,2,power_law_1.01,0.19034240245819092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,2,power_law_1.01,0.20449280738830566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,2,power_law_1.2,0.1913856029510498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,2,power_law_1.2,0.19925119876861572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,32,balanced,0.0626453310251236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,32,balanced,0.06363200147946675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,32,power_law_1.01,0.061868798732757566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,32,power_law_1.01,0.06238080263137817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,32,power_law_1.2,0.06180480122566223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,32,power_law_1.2,0.061964797973632815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,4,balanced,0.1381386617819468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,4,balanced,0.13833600282669067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,4,power_law_1.01,0.1277184009552002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,4,power_law_1.01,0.1329792022705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,4,power_law_1.2,0.13175040483474731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,4,power_law_1.2,0.13185280561447144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,64,balanced,0.06211199859778086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,64,balanced,0.062218666076660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,64,power_law_1.01,0.05974400043487549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,64,power_law_1.01,0.06046079993247986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,64,power_law_1.2,0.06047999858856201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,64,power_law_1.2,0.06088320016860962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,8,balanced,0.10101333260536194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,8,balanced,0.10128532846768697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,8,power_law_1.01,0.08907520174980163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,8,power_law_1.01,0.09095680117607116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,8,power_law_1.2,0.0917568027973175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,1,8,power_law_1.2,0.09557759761810303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,16,1,balanced,0.9058720270792643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,16,1,balanced,0.9290133317311605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,16,1,power_law_1.01,0.7365503787994385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,16,1,power_law_1.01,0.8079487800598144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,16,1,power_law_1.2,0.6928895950317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,16,1,power_law_1.2,0.8390336036682129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,2,1,balanced,0.21215466658274332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,2,1,balanced,0.2141546607017517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,2,1,power_law_1.01,0.19140479564666749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,2,1,power_law_1.01,0.1926911950111389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,2,1,power_law_1.2,0.18929280042648317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,2,1,power_law_1.2,0.1978432059288025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,32,1,balanced,0.7551893393198649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,32,1,balanced,0.7818186283111572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,32,1,power_law_1.01,0.7414207935333252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,32,1,power_law_1.01,0.7525887966156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,32,1,power_law_1.2,0.6136703968048096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,32,1,power_law_1.2,0.7482816219329834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,4,1,balanced,0.1395039955774943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,4,1,balanced,0.1411626636981964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,4,1,power_law_1.01,0.12871040105819703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,4,1,power_law_1.01,0.13144960403442382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,4,1,power_law_1.2,0.13022719621658324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,4,1,power_law_1.2,0.13253120183944703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,8,1,balanced,1.1010186672210693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,8,1,balanced,1.2077759901682537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,8,1,power_law_1.01,1.033132839202881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,8,1,power_law_1.01,1.078592014312744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,8,1,power_law_1.2,0.9340352058410645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,2688,1856,6,128,8,1,power_law_1.2,1.0549440383911133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,1,balanced,0.6003946860631307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,1,balanced,0.6028746763865153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,1,power_law_1.01,0.4935488224029541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,1,power_law_1.01,0.5054975986480713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,1,power_law_1.2,0.4947968006134033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,1,power_law_1.2,0.5110655784606933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,128,balanced,0.09095999598503113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,128,balanced,0.09121599793434143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,128,power_law_1.01,0.09014400243759155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,128,power_law_1.01,0.09020159840583801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,128,power_law_1.2,0.08981760144233704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,128,power_law_1.2,0.08999680280685425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,16,balanced,0.12358400225639343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,16,balanced,0.12468266487121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,16,power_law_1.01,0.11269760131835938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,16,power_law_1.01,0.11694079637527466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,16,power_law_1.2,0.11493760347366333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,16,power_law_1.2,0.11614079475402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,2,balanced,0.35211201508839923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,2,balanced,0.3529226779937744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,2,power_law_1.01,0.2977920055389404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,2,power_law_1.01,0.3088511943817139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,2,power_law_1.2,0.29256319999694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,2,power_law_1.2,0.30256640911102295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,256,balanced,0.09070932865142822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,256,balanced,0.09096533060073853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,256,power_law_1.01,0.08926079869270324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,256,power_law_1.01,0.08935040235519409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,256,power_law_1.2,0.08895999789237977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,256,power_law_1.2,0.08946560025215149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,32,balanced,0.10142933328946431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,32,balanced,0.1023573378721873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,32,power_law_1.01,0.09744639992713929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,32,power_law_1.01,0.09869440197944641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,32,power_law_1.2,0.09832320213317872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,32,power_law_1.2,0.09968640208244324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,4,balanced,0.22429333130518594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,4,balanced,0.22524267435073853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,4,power_law_1.01,0.19527679681777954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,4,power_law_1.01,0.2022847890853882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,4,power_law_1.2,0.2059391975402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,4,power_law_1.2,0.21697280406951905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,64,balanced,0.09291199843088786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,64,balanced,0.09316800038019817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,64,power_law_1.01,0.09091839790344239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,64,power_law_1.01,0.09166719913482665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,64,power_law_1.2,0.09070720076560974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,64,power_law_1.2,0.09159039855003356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,8,balanced,0.1580959955851237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,8,balanced,0.15847999850908914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,8,power_law_1.01,0.14476799964904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,8,power_law_1.01,0.14799360036849976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,8,power_law_1.2,0.14264960289001466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,1,8,power_law_1.2,0.14526079893112182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,16,1,balanced,0.13333866993586221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,16,1,balanced,0.133925328652064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,16,1,power_law_1.01,0.11130880117416382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,16,1,power_law_1.2,0.11080960035324097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,16,1,power_law_1.2,0.11399040222167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,2,1,balanced,0.33958931763966876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,2,1,balanced,0.3401493231455485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,2,1,power_law_1.01,0.2882496118545532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,2,1,power_law_1.01,0.29086079597473147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,2,1,power_law_1.2,0.28694400787353513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,2,1,power_law_1.2,0.28808960914611814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,32,1,balanced,0.11340799927711487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,32,1,balanced,0.11353600025177002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,32,1,power_law_1.01,0.10106879472732544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,32,1,power_law_1.01,0.10135040283203126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,32,1,power_law_1.2,0.10022399425506592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,32,1,power_law_1.2,0.10080000162124633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,4,1,balanced,0.2182240088780721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,4,1,balanced,0.21938133239746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,4,1,power_law_1.01,0.18574719429016112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,4,1,power_law_1.01,0.18752000331878663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,4,1,power_law_1.2,0.18322559595108032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,4,1,power_law_1.2,0.18773119449615477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,8,1,balanced,0.15522133310635886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,8,1,balanced,0.15803733468055725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,8,1,power_law_1.01,0.14067840576171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,8,1,power_law_1.01,0.14370559453964232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,8,1,power_law_1.2,0.13978879451751708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,3072,1536,8,256,8,1,power_law_1.2,0.14135680198669434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,1,balanced,0.28201067447662354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,1,balanced,0.2844906648000081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,1,power_law_1.01,0.28462719917297363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,1,power_law_1.01,0.2933759927749634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,1,power_law_1.2,0.29051520824432375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,1,power_law_1.2,0.2955904006958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,2,balanced,0.19669866561889648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,2,balanced,0.1994719902674357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,2,power_law_1.01,0.20084478855133056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,2,power_law_1.01,0.2094208002090454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,2,power_law_1.2,0.19823360443115234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,2,power_law_1.2,0.1982848048210144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,4,balanced,0.15272000432014465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,4,balanced,0.15362667044003805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,4,power_law_1.01,0.15616639852523803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,4,power_law_1.01,0.15768320560455323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,4,power_law_1.2,0.1535104036331177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,4,power_law_1.2,0.15611519813537597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,8,balanced,0.1240000029404958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,8,balanced,0.12708800037701926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,8,power_law_1.01,0.13073279857635497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,8,power_law_1.01,0.1347391963005066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,8,power_law_1.2,0.13114880323410033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,1,8,power_law_1.2,0.13432960510253905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,16,1,balanced,0.04780266682306925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,16,1,balanced,0.047872001926104225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,16,1,power_law_1.01,0.050316798686981204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,16,1,power_law_1.01,0.05315200090408325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,16,1,power_law_1.2,0.0493120014667511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,16,1,power_law_1.2,0.05070719718933105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,2,1,balanced,0.16482133666674295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,2,1,balanced,0.1674720048904419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,2,1,power_law_1.01,0.16097919940948485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,2,1,power_law_1.01,0.16132479906082153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,2,1,power_law_1.2,0.16225279569625856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,2,1,power_law_1.2,0.1652351975440979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,32,1,balanced,0.03745600084463755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,32,1,balanced,0.03978666663169861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,32,1,power_law_1.01,0.03772160112857818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,32,1,power_law_1.01,0.03845759928226471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,32,1,power_law_1.2,0.037599998712539676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,32,1,power_law_1.2,0.03952000141143799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,4,1,balanced,0.10521066188812256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,4,1,balanced,0.10613333185513814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,4,1,power_law_1.01,0.10191999673843384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,4,1,power_law_1.01,0.10328960418701172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,4,1,power_law_1.2,0.10363520383834839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,4,1,power_law_1.2,0.10373120307922364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,8,1,balanced,0.06697600086530049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,8,1,balanced,0.07004266480604808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,8,1,power_law_1.01,0.06629120111465454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,8,1,power_law_1.01,0.06637439727783204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,8,1,power_law_1.2,0.06467199921607972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,14336,2,8,8,1,power_law_1.2,0.06495360136032105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,1,balanced,0.4175146818161011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,1,balanced,0.4219893217086792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,1,power_law_1.01,0.40082559585571287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,1,power_law_1.01,0.40176000595092776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,1,power_law_1.2,0.402188777923584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,1,power_law_1.2,0.40842881202697756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,128,balanced,0.06689066688219707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,128,balanced,0.06816000243028005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,128,power_law_1.01,0.06585599780082703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,128,power_law_1.01,0.06624000072479248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,128,power_law_1.2,0.06628479957580566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,128,power_law_1.2,0.06696959733963012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,16,balanced,0.08469333251317342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,16,balanced,0.084906667470932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,16,power_law_1.01,0.08287360072135926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,16,power_law_1.01,0.08382080197334289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,16,power_law_1.2,0.082259202003479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,16,power_law_1.2,0.08273919820785522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,2,balanced,0.24709333976109824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,2,balanced,0.24936532974243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,2,power_law_1.01,0.24001920223236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,2,power_law_1.01,0.24069759845733643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,2,power_law_1.2,0.237062406539917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,2,power_law_1.2,0.2438271999359131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,32,balanced,0.0715946654478709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,32,balanced,0.07452799876530965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,32,power_law_1.01,0.07049599885940552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,32,power_law_1.01,0.07088639736175537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,32,power_law_1.2,0.07071999907493591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,32,power_law_1.2,0.0716543972492218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,4,balanced,0.15546666582425436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,4,balanced,0.15594133734703064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,4,power_law_1.01,0.15141119956970214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,4,power_law_1.01,0.1515391945838928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,4,power_law_1.2,0.15073920488357545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,4,power_law_1.2,0.15358079671859742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,64,balanced,0.06818133095900218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,64,balanced,0.0684746652841568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,64,power_law_1.01,0.0673471987247467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,64,power_law_1.01,0.06807039976119995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,64,power_law_1.2,0.067084801197052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,64,power_law_1.2,0.06716160178184509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,8,balanced,0.11188800136248271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,8,balanced,0.11342400312423706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,8,power_law_1.01,0.10755840539932252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,8,power_law_1.01,0.1087488055229187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,8,power_law_1.2,0.10976639986038209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,1,8,power_law_1.2,0.11127040386199952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,16,1,balanced,0.09845866759618123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,16,1,balanced,0.09935999910036723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,16,1,power_law_1.01,0.09418879747390747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,16,1,power_law_1.01,0.09467520117759705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,16,1,power_law_1.2,0.09566720128059387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,16,1,power_law_1.2,0.09635840058326721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,2,1,balanced,0.24409067630767822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,2,1,balanced,0.2449280023574829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,2,1,power_law_1.01,0.23299200534820558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,2,1,power_law_1.01,0.23722240924835206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,2,1,power_law_1.2,0.23924479484558106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,2,1,power_law_1.2,0.2396480083465576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,32,1,balanced,0.0862559974193573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,32,1,balanced,0.08669867118199666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,32,1,power_law_1.01,0.08263040184974671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,32,1,power_law_1.01,0.08350080251693726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,32,1,power_law_1.2,0.08182399868965148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,32,1,power_law_1.2,0.08423039913177491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,4,1,balanced,0.15663466850916544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,4,1,balanced,0.15923733512560526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,4,1,power_law_1.01,0.1488960027694702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,4,1,power_law_1.01,0.14945919513702394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,4,1,power_law_1.2,0.14917759895324706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,4,1,power_law_1.2,0.1518847942352295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,8,1,balanced,0.11719466249148051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,8,1,balanced,0.11829333504041036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,8,1,power_law_1.01,0.10987520217895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,8,1,power_law_1.01,0.11179519891738891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,8,1,power_law_1.2,0.11091840267181396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,1536,8,128,8,1,power_law_1.2,0.11349760293960572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,1,balanced,2.618511994679769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,1,balanced,2.6266773541768393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,1,power_law_1.01,2.2965696334838865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,1,power_law_1.01,2.3300607681274412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,1,power_law_1.2,2.3283008575439452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,1,power_law_1.2,2.349772834777832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,128,balanced,0.2589813272158305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,128,balanced,0.2600640058517456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,128,power_law_1.01,0.2562495946884155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,128,power_law_1.01,0.2571712017059326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,128,power_law_1.2,0.25613439083099365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,128,power_law_1.2,0.25681281089782715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,16,balanced,0.41502400239308673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,16,balanced,0.41680534680684406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,16,power_law_1.01,0.3934976100921631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,16,power_law_1.01,0.40102400779724123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,16,power_law_1.2,0.4024064064025879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,16,power_law_1.2,0.40470399856567385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,2,balanced,1.4449812571207683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,2,balanced,1.4526933034261067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,2,power_law_1.01,1.2906432151794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,2,power_law_1.01,1.3278271675109863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,2,power_law_1.2,1.3060735702514648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,2,power_law_1.2,1.3190976142883302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,256,balanced,0.25304534037907916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,256,balanced,0.2547786633173625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,256,power_law_1.01,0.2532416105270386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,256,power_law_1.01,0.25333120822906496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,256,power_law_1.2,0.2527551889419556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,256,power_law_1.2,0.25277440547943114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,32,balanced,0.3301706711451213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,32,balanced,0.33242666721343994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,32,power_law_1.01,0.3249536037445068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,32,power_law_1.01,0.3255359888076782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,32,power_law_1.2,0.32478721141815187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,32,power_law_1.2,0.32598400115966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,4,balanced,0.8621439933776855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,4,balanced,0.8680640061696371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,4,power_law_1.01,0.7783616065979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,4,power_law_1.01,0.7888512134552002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,4,power_law_1.2,0.8025216102600098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,4,power_law_1.2,0.8166399955749511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,64,balanced,0.2791893283526103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,64,balanced,0.27937599023183185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,64,power_law_1.01,0.2708735942840576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,64,power_law_1.01,0.27331199645996096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,64,power_law_1.2,0.2706496000289917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,64,power_law_1.2,0.2777343988418579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,8,balanced,0.5655786593755087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,8,balanced,0.567850669225057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,8,power_law_1.01,0.5343167781829834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,8,power_law_1.01,0.5428415775299072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,8,power_law_1.2,0.5258560180664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,1,8,power_law_1.2,0.533510398864746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,16,1,balanced,5.545759836832683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,16,1,balanced,6.222415924072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,16,1,power_law_1.01,5.6528575897216795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,16,1,power_law_1.01,5.658348846435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,16,1,power_law_1.2,5.269868850708008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,16,1,power_law_1.2,5.5929920196533205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,2,1,balanced,1.3657066027323406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,2,1,balanced,1.4091946283976238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,2,1,power_law_1.01,1.2074048042297363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,2,1,power_law_1.01,1.215833568572998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,2,1,power_law_1.2,1.2250240325927735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,2,1,power_law_1.2,1.2257216453552247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,32,1,balanced,3.9764480590820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,32,1,balanced,4.391205469767253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,32,1,power_law_1.01,3.3553726196289064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,32,1,power_law_1.01,4.176224136352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,32,1,power_law_1.2,3.235443115234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,32,1,power_law_1.2,3.5960769653320312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,4,1,balanced,0.7804373105367025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,4,1,balanced,0.781493345896403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,4,1,power_law_1.01,0.6956736087799072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,4,1,power_law_1.01,0.699180793762207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,4,1,power_law_1.2,0.699507188796997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,4,1,power_law_1.2,0.7032320022583007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,8,1,balanced,0.49326932430267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,8,1,balanced,0.4968959887822469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,8,1,power_law_1.01,0.4507711887359619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,8,1,power_law_1.01,0.451526403427124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,8,1,power_law_1.2,0.4540736198425293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,4096,2688,22,512,8,1,power_law_1.2,0.45665922164916994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,1,balanced,0.4269333283106486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,1,balanced,0.4272853136062622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,1,power_law_1.01,0.4812863826751709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,1,power_law_1.01,0.4964479923248291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,1,power_law_1.2,0.4524672031402588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,1,power_law_1.2,0.47983360290527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,2,balanced,0.27049599091211957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,2,balanced,0.2735626697540283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,2,power_law_1.01,0.28216960430145266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,2,power_law_1.01,0.28718080520629885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,2,power_law_1.2,0.2886528015136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,2,power_law_1.2,0.2891455888748169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,4,balanced,0.1983733375867208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,4,balanced,0.19914132356643677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,4,power_law_1.01,0.20269439220428467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,4,power_law_1.01,0.2043839931488037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,4,power_law_1.2,0.20413439273834227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,4,power_law_1.2,0.20472960472106932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,8,balanced,0.15017599860827127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,8,balanced,0.15030933419863382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,8,power_law_1.01,0.16619520187377929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,8,power_law_1.01,0.17230080366134642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,8,power_law_1.2,0.17144960165023804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,1,8,power_law_1.2,0.1726464033126831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,16,1,balanced,0.07169066866238911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,16,1,balanced,0.07232533395290375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,16,1,power_law_1.01,0.07200639843940734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,16,1,power_law_1.01,0.07217280268669128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,16,1,power_law_1.2,0.07095040082931518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,16,1,power_law_1.2,0.07313920259475708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,2,1,balanced,0.24177600940068564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,2,1,balanced,0.24555732806523642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,2,1,power_law_1.01,0.24776959419250488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,2,1,power_law_1.01,0.2569472074508667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,2,1,power_law_1.2,0.2508352041244507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,2,1,power_law_1.2,0.25701758861541746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,32,1,balanced,0.04740266501903534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,32,1,balanced,0.05203733344872793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,32,1,power_law_1.01,0.05616639852523804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,32,1,power_law_1.01,0.057030397653579715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,32,1,power_law_1.2,0.05459200143814087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,32,1,power_law_1.2,0.057657599449157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,4,1,balanced,0.14877866705258688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,4,1,balanced,0.14921067158381143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,4,1,power_law_1.01,0.14774399995803833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,4,1,power_law_1.01,0.14784640073776245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,4,1,power_law_1.2,0.1475711941719055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,4,1,power_law_1.2,0.15145599842071533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,8,1,balanced,0.0916319986184438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,8,1,balanced,0.09449066718419392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,8,1,power_law_1.01,0.08782079815864563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,8,1,power_law_1.01,0.0901632010936737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,8,1,power_law_1.2,0.08903679847717286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,16384,2,8,8,1,power_law_1.2,0.09047039747238159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,1,balanced,1.5312426884969075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,1,balanced,1.5348854064941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,1,power_law_1.01,1.27456636428833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,1,power_law_1.01,1.2836031913757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,1,power_law_1.2,1.2410943984985352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,1,power_law_1.2,1.278752040863037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,128,balanced,0.14203199744224548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,128,balanced,0.1421280006567637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,128,power_law_1.01,0.13950719833374023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,128,power_law_1.01,0.1401535987854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,128,power_law_1.2,0.14005119800567628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,128,power_law_1.2,0.14014079570770263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,16,balanced,0.2301386594772339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,16,balanced,0.23091200987497965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,16,power_law_1.01,0.21571838855743408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,16,power_law_1.01,0.21767039299011232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,16,power_law_1.2,0.22132480144500732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,16,power_law_1.2,0.2232448101043701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,2,balanced,0.8401546478271484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,2,balanced,0.8431893189748129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,2,power_law_1.01,0.7080319881439209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,2,power_law_1.01,0.734764814376831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,2,power_law_1.2,0.7016255855560303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,2,power_law_1.2,0.7187456130981446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,256,balanced,0.13801599542299905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,256,balanced,0.14029332995414734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,256,power_law_1.01,0.1364799976348877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,256,power_law_1.01,0.13683199882507324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,256,power_law_1.2,0.1361407995223999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,256,power_law_1.2,0.13615360260009765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,32,balanced,0.17133333285649618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,32,balanced,0.17166399955749512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,32,power_law_1.01,0.162009596824646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,32,power_law_1.01,0.16588159799575805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,32,power_law_1.2,0.1615679979324341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,32,power_law_1.2,0.16547199487686157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,4,balanced,0.4888053337732951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,4,balanced,0.4891039927800496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,4,power_law_1.01,0.4225791931152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,4,power_law_1.01,0.44140801429748533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,4,power_law_1.2,0.4371327877044678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,4,power_law_1.2,0.43889918327331545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,64,balanced,0.14869866768519083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,64,balanced,0.14909332990646362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,64,power_law_1.01,0.14531840085983277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,64,power_law_1.01,0.145632004737854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,64,power_law_1.2,0.14484479427337646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,64,power_law_1.2,0.14504319429397583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,8,balanced,0.3158613244692485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,8,balanced,0.31679999828338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,8,power_law_1.01,0.2862207889556885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,8,power_law_1.01,0.31223039627075194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,8,power_law_1.2,0.28231039047241213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,1,8,power_law_1.2,0.29097599983215333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,16,1,balanced,0.24207466840744019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,16,1,balanced,0.24226133028666177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,16,1,power_law_1.01,0.2024832010269165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,16,1,power_law_1.01,0.20363519191741944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,16,1,power_law_1.2,0.20131199359893798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,16,1,power_law_1.2,0.2033087968826294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,2,1,balanced,0.8023573557535807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,2,1,balanced,0.8037919998168945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,2,1,power_law_1.01,0.680294418334961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,2,1,power_law_1.01,0.6856383800506591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,2,1,power_law_1.2,0.6704768180847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,2,1,power_law_1.2,0.6745984077453613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,32,1,balanced,0.19878933827082315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,32,1,balanced,0.19989333550135294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,32,1,power_law_1.01,0.18112640380859374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,32,1,power_law_1.01,0.18298879861831666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,32,1,power_law_1.2,0.18234239816665648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,32,1,power_law_1.2,0.18250880241394044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,4,1,balanced,0.4650133450826009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,4,1,balanced,0.4657226800918579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,4,1,power_law_1.01,0.39825921058654784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,4,1,power_law_1.01,0.39984641075134275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,4,1,power_law_1.2,0.39587199687957764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,4,1,power_law_1.2,0.3968319892883301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,8,1,balanced,0.31226134300231934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,8,1,balanced,0.3129226764043172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,8,1,power_law_1.01,0.2622143983840942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,8,1,power_law_1.01,0.26469759941101073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,8,1,power_law_1.2,0.2609215974807739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2048,8,256,8,1,power_law_1.2,0.2624255895614624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,1,balanced,1.215231974919637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,1,balanced,1.2287253538767497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,1,power_law_1.01,1.0815168380737306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,1,power_law_1.01,1.096083164215088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,1,power_law_1.2,1.1045503616333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,1,power_law_1.2,1.1149760246276856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,16,balanced,0.181002676486969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,16,balanced,0.18378132581710815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,16,power_law_1.01,0.1703935980796814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,16,power_law_1.01,0.17305599451065062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,16,power_law_1.2,0.17200640439987183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,16,power_law_1.2,0.17494399547576905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,2,balanced,0.6569066842397054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,2,balanced,0.6570826768875122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,2,power_law_1.01,0.6009791851043701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,2,power_law_1.01,0.6222976207733154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,2,power_law_1.2,0.6072447776794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,2,power_law_1.2,0.6169343948364258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,32,balanced,0.12617599964141846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,32,balanced,0.12756266196568808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,32,power_law_1.01,0.12283519506454468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,32,power_law_1.01,0.12429440021514893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,32,power_law_1.2,0.12435840368270874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,32,power_law_1.2,0.12553600072860718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,4,balanced,0.3837653398513794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,4,balanced,0.38683732350667316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,4,power_law_1.01,0.3590656042098999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,4,power_law_1.01,0.371558403968811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,4,power_law_1.2,0.3621952056884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,4,power_law_1.2,0.3632256031036377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,8,balanced,0.2476053237915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,8,balanced,0.24787733952204385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,8,power_law_1.01,0.23135359287261964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,8,power_law_1.01,0.24027519226074218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,8,power_law_1.2,0.2359999895095825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,1,8,power_law_1.2,0.243123197555542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,16,1,balanced,0.1987733244895935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,16,1,balanced,0.19899199406305948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,16,1,power_law_1.01,0.1706112027168274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,16,1,power_law_1.01,0.17242879867553712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,16,1,power_law_1.2,0.18083200454711915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,16,1,power_law_1.2,0.19184000492095948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,2,1,balanced,0.646074652671814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,2,1,balanced,0.6478773355484009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,2,1,power_law_1.01,0.5837247848510743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,2,1,power_law_1.01,0.5873727798461914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,2,1,power_law_1.2,0.5922815799713135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,2,1,power_law_1.2,0.5992191791534424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,32,1,balanced,0.15269333124160767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,32,1,balanced,0.15380799770355225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,32,1,power_law_1.01,0.14439040422439575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,32,1,power_law_1.01,0.14525439739227294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,32,1,power_law_1.2,0.14728319644927979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,32,1,power_law_1.2,0.14755840301513673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,4,1,balanced,0.36934932072957355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,4,1,balanced,0.3706773519515991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,4,1,power_law_1.01,0.34327681064605714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,4,1,power_law_1.01,0.3476416110992432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,4,1,power_law_1.2,0.3532288074493408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,4,1,power_law_1.2,0.3542335987091064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,8,1,balanced,0.23635200659434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,8,1,balanced,0.2384373346964518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,8,1,power_law_1.01,0.2201472043991089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,8,1,power_law_1.01,0.22211201190948487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,8,1,power_law_1.2,0.2253567934036255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,6144,2560,8,160,8,1,power_law_1.2,0.2256511926651001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,1,balanced,1.7715253829956055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,1,balanced,1.7751946449279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,1,power_law_1.01,1.44137601852417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,1,power_law_1.01,1.478495979309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,1,power_law_1.2,1.4674367904663086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,1,power_law_1.2,1.4797183990478515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,128,balanced,0.15426133076349893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,128,balanced,0.15679466724395752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,128,power_law_1.01,0.1533951997756958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,128,power_law_1.01,0.15397119522094727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,128,power_law_1.2,0.15362559556961058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,128,power_law_1.2,0.15423359870910644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,16,balanced,0.26050132513046265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,16,balanced,0.2613813281059265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,16,power_law_1.01,0.24130558967590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,16,power_law_1.01,0.2473599910736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,16,power_law_1.2,0.23703041076660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,16,power_law_1.2,0.24724481105804444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,2,balanced,0.9675467014312744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,2,balanced,0.9792053699493408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,2,power_law_1.01,0.7906239986419678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,2,power_law_1.01,0.816160011291504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,2,power_law_1.2,0.8261183738708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,2,power_law_1.2,0.8625087738037109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,256,balanced,0.15036799510320029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,256,balanced,0.1509066621462504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,256,power_law_1.01,0.1487231969833374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,256,power_law_1.01,0.14904320240020752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,256,power_law_1.2,0.14979200363159179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,256,power_law_1.2,0.15047680139541625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,32,balanced,0.19223467508951822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,32,balanced,0.19264533122380575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,32,power_law_1.01,0.18700799942016602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,32,power_law_1.01,0.18724479675292968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,32,power_law_1.2,0.18248319625854492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,32,power_law_1.2,0.1835904002189636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,4,balanced,0.5588853359222412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,4,balanced,0.5590560038884481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,4,power_law_1.01,0.5114560127258301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,4,power_law_1.01,0.5121600151062011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,4,power_law_1.2,0.5073599815368652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,4,power_law_1.2,0.510207986831665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,64,balanced,0.16237333416938782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,64,balanced,0.162581334511439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,64,power_law_1.01,0.1592128038406372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,64,power_law_1.01,0.1600000023841858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,64,power_law_1.2,0.15971200466156005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,64,power_law_1.2,0.16042879819869996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,8,balanced,0.3593706687291463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,8,balanced,0.36618133385976154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,8,power_law_1.01,0.3272320032119751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,8,power_law_1.01,0.34294400215148924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,8,power_law_1.2,0.31766400337219236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,1,8,power_law_1.2,0.32728960514068606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,16,1,balanced,0.27720000346501666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,16,1,balanced,0.27742934226989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,16,1,power_law_1.01,0.22941439151763915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,16,1,power_law_1.01,0.23176960945129393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,16,1,power_law_1.2,0.22622079849243165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,16,1,power_law_1.2,0.23095040321350097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,2,1,balanced,0.9355359872182211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,2,1,balanced,0.9396373430887858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,2,1,power_law_1.01,0.7786367893218994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,2,1,power_law_1.01,0.7838208198547363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,2,1,power_law_1.2,0.7682112216949463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,2,1,power_law_1.2,0.7792448043823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,32,1,balanced,0.22588799397150675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,32,1,balanced,0.22621333599090576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,32,1,power_law_1.01,0.208076810836792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,32,1,power_law_1.01,0.21024000644683838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,32,1,power_law_1.2,0.20777599811553954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,32,1,power_law_1.2,0.20855040550231935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,4,1,balanced,0.5372053384780884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,4,1,balanced,0.5393919944763184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,4,1,power_law_1.01,0.45889921188354493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,4,1,power_law_1.01,0.46151041984558105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,4,1,power_law_1.2,0.46102399826049806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,4,1,power_law_1.2,0.46251521110534666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,8,1,balanced,0.36095468203226727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,8,1,balanced,0.3617440064748128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,8,1,power_law_1.01,0.3041215896606445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,8,1,power_law_1.01,0.3042880058288574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,8,1,power_law_1.2,0.303385591506958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,256,8,1,power_law_1.2,0.3043776035308838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,1,balanced,2.7068001429239907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,1,balanced,2.7219626108805337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,1,power_law_1.01,2.011494445800781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,1,power_law_1.01,2.0596031188964843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,1,power_law_1.2,1.961644744873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,1,power_law_1.2,2.0048639297485353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,128,balanced,0.21339199940363565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,128,balanced,0.21384533246358237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,128,power_law_1.01,0.2094719886779785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,128,power_law_1.01,0.21095681190490723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,128,power_law_1.2,0.21070079803466796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,128,power_law_1.2,0.21095681190490723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,16,balanced,0.35496000448862713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,16,balanced,0.35787200927734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,16,power_law_1.01,0.32819840908050535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,16,power_law_1.01,0.330841588973999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,16,power_law_1.2,0.311244797706604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,16,power_law_1.2,0.312064003944397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,2,balanced,1.43230406443278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,2,balanced,1.4546292622884114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,2,power_law_1.01,1.0811519622802734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,2,power_law_1.01,1.124019241333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,2,power_law_1.2,1.100601577758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,2,power_law_1.2,1.147430419921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,32,balanced,0.2776106595993042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,32,balanced,0.2781920035680135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,32,power_law_1.01,0.2583168029785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,32,power_law_1.01,0.2650559902191162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,32,power_law_1.2,0.2519040107727051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,32,power_law_1.2,0.2559295892715454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,4,balanced,0.8126933574676514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,4,balanced,0.8141012986501058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,4,power_law_1.01,0.6696256160736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,4,power_law_1.01,0.7113344192504882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,4,power_law_1.2,0.6803840160369873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,4,power_law_1.2,0.6877376079559326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,64,balanced,0.22734399636586508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,64,balanced,0.22805333137512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,64,power_law_1.01,0.2207808017730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,64,power_law_1.01,0.2240000009536743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,64,power_law_1.2,0.21879680156707765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,64,power_law_1.2,0.22093439102172852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,8,balanced,0.5131466786066691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,8,balanced,0.5144693454106649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,8,power_law_1.01,0.4648064136505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,8,power_law_1.01,0.48099842071533205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,8,power_law_1.2,0.4402495861053467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,1,8,power_law_1.2,0.45883522033691404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,16,1,balanced,0.3693973223368327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,16,1,balanced,0.3704906702041626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,16,1,power_law_1.01,0.3199359893798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,16,1,power_law_1.01,0.3218496084213257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,16,1,power_law_1.2,0.31832959651947024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,16,1,power_law_1.2,0.31962881088256834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,2,1,balanced,1.356122652689616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,2,1,balanced,1.3917333285013835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,2,1,power_law_1.01,1.0489536285400392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,2,1,power_law_1.01,1.056492805480957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,2,1,power_law_1.2,1.02041597366333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,2,1,power_law_1.2,1.0375871658325195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,32,1,balanced,0.31364800532658893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,32,1,balanced,0.3141973416010539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,32,1,power_law_1.01,0.2705919981002808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,32,1,power_law_1.01,0.270630407333374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,32,1,power_law_1.2,0.2689471960067749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,32,1,power_law_1.2,0.2703423976898193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,4,1,balanced,0.7746720314025879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,4,1,balanced,0.7750720183054606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,4,1,power_law_1.01,0.6186624050140381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,4,1,power_law_1.01,0.6320896148681641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,4,1,power_law_1.2,0.6049920082092285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,4,1,power_law_1.2,0.6171328067779541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,8,1,balanced,0.5058720111846924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,8,1,balanced,0.5089813470840454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,8,1,power_law_1.01,0.41000962257385254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,8,1,power_law_1.01,0.4131904125213623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,8,1,power_law_1.2,0.4065087795257568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,128,7168,2048,8,384,8,1,power_law_1.2,0.4087423801422119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,1,balanced,0.23875733216603598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,1,balanced,0.23913600047429404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,1,power_law_1.01,0.27400960922241213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,1,power_law_1.01,0.27411839962005613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,1,power_law_1.2,0.2808768033981323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,1,power_law_1.2,0.2817408084869385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,128,balanced,0.1195146640141805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,128,balanced,0.12011200189590454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,128,power_law_1.01,0.12182400226593018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,128,power_law_1.01,0.1239743947982788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,128,power_law_1.2,0.12450560331344604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,128,power_law_1.2,0.12481919527053834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,16,balanced,0.12773866454760233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,16,balanced,0.12787733475367227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,16,power_law_1.01,0.13581440448760987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,16,power_law_1.01,0.1365056037902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,16,power_law_1.2,0.13544960021972657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,16,power_law_1.2,0.1368127942085266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,2,balanced,0.18992000818252563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,2,balanced,0.19163199265797934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,2,power_law_1.01,0.21162879467010498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,2,power_law_1.01,0.21298561096191407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,2,power_law_1.2,0.21806719303131103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,2,power_law_1.2,0.21977601051330567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,32,balanced,0.12211199601491292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,32,balanced,0.12261866529782613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,32,power_law_1.01,0.12728320360183715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,32,power_law_1.01,0.12748160362243652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,32,power_law_1.2,0.13040640354156494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,32,power_law_1.2,0.13155200481414794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,4,balanced,0.15600533286730447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,4,balanced,0.15704533457756042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,4,power_law_1.01,0.1701632022857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,4,power_law_1.01,0.17503360509872437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,4,power_law_1.2,0.1741696000099182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,4,power_law_1.2,0.17441920042037964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,64,balanced,0.12012267112731934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,64,balanced,0.12037332852681477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,64,power_law_1.01,0.12372479438781739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,64,power_law_1.01,0.12398079633712769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,64,power_law_1.2,0.1271999955177307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,64,power_law_1.2,0.1272320032119751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,8,balanced,0.13618666927019754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,8,balanced,0.13726400335629782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,8,power_law_1.01,0.14536960124969484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,8,power_law_1.01,0.14877439737319947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,8,power_law_1.2,0.1502527952194214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,1,8,power_law_1.2,0.15194239616394042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,2,1,balanced,0.16887466112772623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,2,1,balanced,0.16977600256601968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,2,1,power_law_1.01,0.19086079597473143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,2,1,power_law_1.01,0.19278080463409425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,2,1,power_law_1.2,0.19731199741363525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,2,1,power_law_1.2,0.19895039796829223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,4,1,balanced,0.14269866545995077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,4,1,balanced,0.1427786648273468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,4,1,power_law_1.01,0.15449600219726561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,4,1,power_law_1.01,0.1570623993873596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,4,1,power_law_1.2,0.15969280004501343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2048,768,8,128,4,1,power_law_1.2,0.16087039709091186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,1,balanced,0.5064533154169718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,1,balanced,0.5073920090993246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,1,power_law_1.01,0.5639039993286132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,1,power_law_1.01,0.5665023803710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,1,power_law_1.2,0.5756288051605225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,1,power_law_1.2,0.5810880184173584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,128,balanced,0.15452800194422403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,128,balanced,0.15601600209871927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,128,power_law_1.01,0.16053119897842408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,128,power_law_1.01,0.16199040412902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,128,power_law_1.2,0.16802560091018676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,128,power_law_1.2,0.16895999908447265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,16,balanced,0.17720532417297363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,16,balanced,0.179967999458313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,16,power_law_1.01,0.19274879693984986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,16,power_law_1.01,0.19421440362930298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,16,power_law_1.2,0.1943295955657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,16,power_law_1.2,0.19658880233764647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,2,balanced,0.34774935245513916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,2,balanced,0.348410685857137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,2,power_law_1.01,0.3728447914123535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,2,power_law_1.01,0.3772671937942505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,2,power_law_1.2,0.3772032022476196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,2,power_law_1.2,0.3966399908065796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,32,balanced,0.1641866664091746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,32,balanced,0.16455466548601785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,32,power_law_1.01,0.17626240253448486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,32,power_law_1.01,0.17649279832839965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,32,power_law_1.2,0.18119679689407348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,32,power_law_1.2,0.1832128047943115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,4,balanced,0.2596106727917989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,4,balanced,0.26048000653584796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,4,power_law_1.01,0.27693440914154055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,4,power_law_1.01,0.28346240520477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,4,power_law_1.2,0.2829440116882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,4,power_law_1.2,0.285696005821228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,64,balanced,0.15678933262825012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,64,balanced,0.15715733170509338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,64,power_law_1.01,0.16460800170898438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,64,power_law_1.01,0.1672127962112427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,64,power_law_1.2,0.16989439725875854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,64,power_law_1.2,0.17167359590530396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,8,balanced,0.20804800589879355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,8,balanced,0.20946133136749268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,8,power_law_1.01,0.22403841018676757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,8,power_law_1.01,0.22965118885040284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,8,power_law_1.2,0.2328320026397705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,1,8,power_law_1.2,0.23491199016571046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,16,1,balanced,0.8075520197550455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,16,1,balanced,0.8101653258005778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,16,1,power_law_1.01,0.9959232330322265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,16,1,power_law_1.01,1.0082688331604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,16,1,power_law_1.2,1.0461759567260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,16,1,power_law_1.2,1.0470656394958495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,2,1,balanced,0.3171306649843852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,2,1,balanced,0.3172053297360738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,2,1,power_law_1.01,0.34708480834960936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,2,1,power_law_1.01,0.35425920486450196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,2,1,power_law_1.2,0.3559231996536255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,2,1,power_law_1.2,0.3586816072463989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,32,1,balanced,0.6975626945495605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,32,1,balanced,0.7022506395975748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,32,1,power_law_1.01,0.8691200256347656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,32,1,power_law_1.01,0.8886591911315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,32,1,power_law_1.2,0.9146688461303711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,32,1,power_law_1.2,0.9187775611877441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,4,1,balanced,0.22075200080871582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,4,1,balanced,0.22205867369969687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,4,1,power_law_1.01,0.24366719722747804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,4,1,power_law_1.01,0.2448256015777588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,4,1,power_law_1.2,0.24654719829559327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,4,1,power_law_1.2,0.2473088026046753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,8,1,balanced,1.1026026407877605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,8,1,balanced,1.14082670211792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,8,1,power_law_1.01,1.3440447807312013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,8,1,power_law_1.01,1.3953408241271972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,8,1,power_law_1.2,1.4202624320983888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,2688,1856,6,128,8,1,power_law_1.2,1.4258048057556152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,1,balanced,0.8357280095418295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,1,balanced,0.8484000364939371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,1,power_law_1.01,0.8678463935852051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,1,power_law_1.01,0.8701696395874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,1,power_law_1.2,0.8856127738952637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,1,power_law_1.2,0.9056447982788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,128,balanced,0.20531733830769858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,128,balanced,0.20637865861256918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,128,power_law_1.01,0.20953600406646727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,128,power_law_1.01,0.21055359840393068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,128,power_law_1.2,0.21107840538024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,128,power_law_1.2,0.21301119327545165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,16,balanced,0.25041067600250244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,16,balanced,0.2508106629053752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,16,power_law_1.01,0.26218879222869873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,16,power_law_1.01,0.2638335943222046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,16,power_law_1.2,0.2675391912460327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,16,power_law_1.2,0.2680511951446533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,2,balanced,0.5409813324610392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,2,balanced,0.5427199999491373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,2,power_law_1.01,0.5586112022399903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,2,power_law_1.01,0.5604159832000732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,2,power_law_1.2,0.5684480190277099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,2,power_law_1.2,0.5684927940368653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,256,balanced,0.20336532592773438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,256,balanced,0.2039573391278585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,256,power_law_1.01,0.20527999401092528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,256,power_law_1.01,0.20631039142608643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,256,power_law_1.2,0.2081536054611206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,256,power_law_1.2,0.20843520164489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,32,balanced,0.22482667366663614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,32,balanced,0.22510933876037598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,32,power_law_1.01,0.23340160846710206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,32,power_law_1.01,0.23383040428161622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,32,power_law_1.2,0.23836801052093506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,32,power_law_1.2,0.23999359607696533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,4,balanced,0.3815466562906901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,4,balanced,0.38173333803812665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,4,power_law_1.01,0.3869375944137573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,4,power_law_1.01,0.3936192035675049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,4,power_law_1.2,0.40424318313598634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,4,power_law_1.2,0.40561280250549314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,64,balanced,0.2107306718826294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,64,balanced,0.21182932456334433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,64,power_law_1.01,0.216377592086792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,64,power_law_1.01,0.21863679885864257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,64,power_law_1.2,0.22203519344329833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,64,power_law_1.2,0.2241919994354248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,8,balanced,0.29356799523035687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,8,balanced,0.2959679961204529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,8,power_law_1.01,0.3034303903579712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,8,power_law_1.01,0.30563840866088865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,8,power_law_1.2,0.3128895998001099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,1,8,power_law_1.2,0.3133824110031128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,16,1,balanced,0.2266026735305786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,16,1,balanced,0.22713599602381387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,16,1,power_law_1.01,0.23434879779815673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,16,1,power_law_1.01,0.2375744104385376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,16,1,power_law_1.2,0.2523519992828369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,16,1,power_law_1.2,0.25241599082946775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,2,1,balanced,0.5071573257446289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,2,1,balanced,0.5076959927876791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,2,1,power_law_1.01,0.515993595123291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,2,1,power_law_1.01,0.524883222579956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,2,1,power_law_1.2,0.5419968128204345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,2,1,power_law_1.2,0.5437376022338867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,32,1,balanced,0.20605866114298502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,32,1,balanced,0.20612800121307373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,32,1,power_law_1.01,0.2149120092391968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,32,1,power_law_1.01,0.2171839952468872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,32,1,power_law_1.2,0.227455997467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,32,1,power_law_1.2,0.22977919578552247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,4,1,balanced,0.3426400025685628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,4,1,balanced,0.3447466691335042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,4,1,power_law_1.01,0.35089280605316164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,4,1,power_law_1.01,0.35187199115753176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,4,1,power_law_1.2,0.36034560203552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,4,1,power_law_1.2,0.3669568061828613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,8,1,balanced,0.2659893234570821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,8,1,balanced,0.2663840055465698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,8,1,power_law_1.01,0.27470719814300537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,8,1,power_law_1.01,0.27487359046936033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,8,1,power_law_1.2,0.2896895885467529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,3072,1536,8,256,8,1,power_law_1.2,0.2930943965911865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,1,balanced,0.784991979598999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,1,balanced,0.7901386419932047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,1,power_law_1.01,0.8642815589904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,1,power_law_1.01,0.8782208442687989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,1,power_law_1.2,0.8693056106567383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,1,power_law_1.2,0.8840703964233398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,2,balanced,0.5185013214747111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,2,balanced,0.5209866762161255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,2,power_law_1.01,0.6110655784606933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,2,power_law_1.01,0.6159743785858154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,2,power_law_1.2,0.6237184047698975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,2,power_law_1.2,0.658784008026123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,4,balanced,0.3654293219248454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,4,balanced,0.3678079843521118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,4,power_law_1.01,0.5273344039916992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,4,power_law_1.01,0.5342400074005127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,4,power_law_1.2,0.5181759834289551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,4,power_law_1.2,0.535481595993042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,8,balanced,0.321125328540802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,8,balanced,0.32130134105682373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,8,power_law_1.01,0.4513279914855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,8,power_law_1.01,0.48919038772583007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,8,power_law_1.2,0.4895808219909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,1,8,power_law_1.2,0.49441280364990237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,16,1,balanced,0.11512533823649089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,16,1,balanced,0.11560533444086711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,16,1,power_law_1.01,0.11960959434509277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,16,1,power_law_1.2,0.11808639764785767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,16,1,power_law_1.2,0.12019840478897095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,2,1,balanced,0.42149333159128827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,2,1,balanced,0.42261866728464764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,2,1,power_law_1.01,0.46924800872802735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,2,1,power_law_1.01,0.4755199909210205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,2,1,power_law_1.2,0.45757441520690917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,2,1,power_law_1.2,0.4635647773742676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,32,1,balanced,0.08724799752235413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,32,1,balanced,0.08788800239562988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,32,1,power_law_1.01,0.08965759873390197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,32,1,power_law_1.01,0.09143679738044738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,32,1,power_law_1.2,0.09086719751358033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,32,1,power_law_1.2,0.09207040071487427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,4,1,balanced,0.23747199773788452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,4,1,balanced,0.24162666002909342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,4,1,power_law_1.01,0.2670655965805054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,4,1,power_law_1.01,0.2681663990020752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,4,1,power_law_1.2,0.2644160032272339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,4,1,power_law_1.2,0.26645760536193847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,8,1,balanced,0.15454933047294617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,8,1,balanced,0.15503467122713724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,8,1,power_law_1.01,0.16467200517654418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,8,1,power_law_1.01,0.1657663941383362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,8,1,power_law_1.2,0.16416640281677247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,14336,2,8,8,1,power_law_1.2,0.16457600593566896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,1,balanced,0.6242560148239136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,1,balanced,0.6276640097300211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,1,power_law_1.01,0.7283135890960694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,1,power_law_1.01,0.7475391864776612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,1,power_law_1.2,0.7550399780273438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,1,power_law_1.2,0.7572735786437989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,128,balanced,0.19928000370661417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,128,balanced,0.20125333468119302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,128,power_law_1.01,0.2092288017272949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,128,power_law_1.01,0.2122431993484497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,128,power_law_1.2,0.22074880599975585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,128,power_law_1.2,0.2218048095703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,16,balanced,0.2241706649462382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,16,balanced,0.22444800535837808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,16,power_law_1.01,0.24217600822448732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,16,power_law_1.01,0.25182719230651857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,16,power_law_1.2,0.25157120227813723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,16,power_law_1.2,0.25858559608459475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,2,balanced,0.43187201023101807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,2,balanced,0.43386133511861164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,2,power_law_1.01,0.49640960693359376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,2,power_law_1.01,0.4988351821899414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,2,power_law_1.2,0.5025536060333252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,2,power_law_1.2,0.510752010345459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,32,balanced,0.20862932999928793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,32,balanced,0.21034133434295654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,32,power_law_1.01,0.22990078926086427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,32,power_law_1.01,0.23228158950805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,32,power_law_1.2,0.23875839710235597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,32,power_law_1.2,0.23922560214996338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,4,balanced,0.31549866994222003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,4,balanced,0.3157973289489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,4,power_law_1.01,0.35999360084533694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,4,power_law_1.01,0.36170239448547364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,4,power_law_1.2,0.3674623966217041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,4,power_law_1.2,0.3790015935897827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,64,balanced,0.20332266887029013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,64,balanced,0.20422399044036865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,64,power_law_1.01,0.21573760509490966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,64,power_law_1.01,0.22354559898376464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,64,power_law_1.2,0.2207360029220581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,64,power_law_1.2,0.22709760665893555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,8,balanced,0.25498666365941364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,8,balanced,0.2584853370984395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,8,power_law_1.01,0.28628480434417725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,8,power_law_1.01,0.2918976068496704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,8,power_law_1.2,0.2892863988876343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,1,8,power_law_1.2,0.29285120964050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,16,1,balanced,0.1965706745783488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,16,1,balanced,0.1982826590538025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,16,1,power_law_1.01,0.231660795211792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,16,1,power_law_1.01,0.23313920497894286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,16,1,power_law_1.2,0.23459200859069823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,16,1,power_law_1.2,0.23462400436401368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,2,1,balanced,0.3970133463541667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,2,1,balanced,0.39928531646728516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,2,1,power_law_1.01,0.4586048126220703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,2,1,power_law_1.01,0.4615935802459717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,2,1,power_law_1.2,0.46160640716552737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,2,1,power_law_1.2,0.47019519805908205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,32,1,balanced,0.18888533115386963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,32,1,balanced,0.1909760038057963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,32,1,power_law_1.01,0.20943999290466309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,32,1,power_law_1.01,0.21116158962249756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,32,1,power_law_1.2,0.21193599700927734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,32,1,power_law_1.2,0.2122112035751343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,4,1,balanced,0.2787040074666341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,4,1,balanced,0.27993067105611164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,4,1,power_law_1.01,0.3171135902404785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,4,1,power_law_1.01,0.31712000370025634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,4,1,power_law_1.2,0.32602241039276125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,4,1,power_law_1.2,0.3316096067428589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,8,1,balanced,0.232640008131663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,8,1,balanced,0.23376532395680746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,8,1,power_law_1.01,0.2546688079833984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,8,1,power_law_1.01,0.2551424026489258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,8,1,power_law_1.2,0.26465280055999757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,1536,8,128,8,1,power_law_1.2,0.2661504030227661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,1,balanced,3.866688092549642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,1,balanced,3.934549331665039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,1,power_law_1.01,4.145888137817383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,1,power_law_1.01,4.1847999572753904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,1,power_law_1.2,4.325612640380859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,1,power_law_1.2,4.384518432617187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,128,balanced,0.7220426400502523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,128,balanced,0.7221333185831705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,128,power_law_1.01,0.7461567878723144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,128,power_law_1.01,0.7490431785583496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,128,power_law_1.2,0.7485311985015869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,128,power_law_1.2,0.7546815872192383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,16,balanced,0.8948000272115072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,16,balanced,0.8989813327789307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,16,power_law_1.01,0.9450048446655274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,16,power_law_1.01,0.9455360412597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,16,power_law_1.2,0.9630592346191407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,16,power_law_1.2,0.9680064201354981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,2,balanced,2.2223092714945474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,2,balanced,2.234288056691488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,2,power_law_1.01,2.4367040634155273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,2,power_law_1.01,2.4410240173339846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,2,power_law_1.2,2.536147117614746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,2,power_law_1.2,2.565817642211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,256,balanced,0.7136586507161459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,256,balanced,0.7138240337371826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,256,power_law_1.01,0.7302464008331299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,256,power_law_1.01,0.7311552047729493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,256,power_law_1.2,0.7387135982513428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,256,power_law_1.2,0.7427840232849121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,32,balanced,0.7969386577606201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,32,balanced,0.80131729443868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,32,power_law_1.01,0.8363903999328614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,32,power_law_1.01,0.8386495590209961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,32,power_law_1.2,0.8512384414672851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,32,power_law_1.2,0.8570367813110351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,4,balanced,1.4533599217732747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,4,balanced,1.4553866386413574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,4,power_law_1.01,1.5506879806518554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,4,power_law_1.01,1.5869888305664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,4,power_law_1.2,1.6321792602539062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,4,power_law_1.2,1.6368255615234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,64,balanced,0.747920036315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,64,balanced,0.7505066394805908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,64,power_law_1.01,0.7774144172668457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,64,power_law_1.01,0.7774400234222412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,64,power_law_1.2,0.7918591976165772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,64,power_law_1.2,0.79203200340271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,8,balanced,1.0876266956329346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,8,balanced,1.092303991317749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,8,power_law_1.01,1.1490240097045898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,8,power_law_1.01,1.1612735748291017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,8,power_law_1.2,1.1671744346618653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,1,8,power_law_1.2,1.1848064422607423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,16,1,balanced,5.883066813151042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,16,1,balanced,6.268197377522786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,16,1,power_law_1.01,7.3945152282714846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,16,1,power_law_1.01,7.441657257080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,16,1,power_law_1.2,7.734976196289063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,16,1,power_law_1.2,7.779443359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,2,1,balanced,2.0325867335001626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,2,1,balanced,2.1184852917989097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,2,1,power_law_1.01,2.2042688369750976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,2,1,power_law_1.01,2.248480033874512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,2,1,power_law_1.2,2.3101312637329103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,2,1,power_law_1.2,2.315603256225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,32,1,balanced,4.099439938863118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,32,1,balanced,4.166607856750488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,32,1,power_law_1.01,5.0593406677246096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,32,1,power_law_1.01,5.069158554077148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,32,1,power_law_1.2,5.257952117919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,32,1,power_law_1.2,5.288832092285157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,4,1,balanced,1.249402681986491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,4,1,balanced,1.2507200241088867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,4,1,power_law_1.01,1.390233612060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,4,1,power_law_1.01,1.3965951919555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,4,1,power_law_1.2,1.4243455886840821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,4,1,power_law_1.2,1.4311552047729492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,8,1,balanced,0.8611413637797037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,8,1,balanced,0.8620213667551676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,8,1,power_law_1.01,0.9524095535278321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,8,1,power_law_1.01,0.9554816246032715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,8,1,power_law_1.2,0.9759936332702637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,4096,2688,22,512,8,1,power_law_1.2,0.9790592193603516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,1,balanced,1.2303893566131592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,1,balanced,1.233680009841919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,1,power_law_1.01,1.348703956604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,1,power_law_1.01,1.3716799736022949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,1,power_law_1.2,1.3438400268554687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,1,power_law_1.2,1.3463680267333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,2,balanced,0.7142666975657145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,2,balanced,0.7280373573303223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,2,power_law_1.01,0.877683162689209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,2,power_law_1.01,1.0461503982543945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,2,power_law_1.2,0.919980812072754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,2,power_law_1.2,1.0064767837524413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,4,balanced,0.46674664815266925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,4,balanced,0.4733440081278483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,4,power_law_1.01,0.707263994216919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,4,power_law_1.01,0.7130559921264649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,4,power_law_1.2,0.7089344024658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,4,power_law_1.2,0.756550407409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,8,balanced,0.38838398456573486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,8,balanced,0.3940693140029907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,8,power_law_1.01,0.59683837890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,8,power_law_1.01,0.6419328212738037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,8,power_law_1.2,0.5929279804229737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,1,8,power_law_1.2,0.6590144157409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,16,1,balanced,0.15901333093643188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,16,1,balanced,0.16249066591262817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,16,1,power_law_1.01,0.16323200464248658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,16,1,power_law_1.01,0.16442879438400268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,16,1,power_law_1.2,0.16344959735870362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,16,1,power_law_1.2,0.16447999477386474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,2,1,balanced,0.6360053221384684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,2,1,balanced,0.6430826584498087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,2,1,power_law_1.01,0.7172031879425049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,2,1,power_law_1.01,0.7240960121154785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,2,1,power_law_1.2,0.7006656169891358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,2,1,power_law_1.2,0.7288640022277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,32,1,balanced,0.11712533235549927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,32,1,balanced,0.11730133493741353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,32,1,power_law_1.01,0.11889920234680176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,32,1,power_law_1.01,0.11990400552749633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,32,1,power_law_1.2,0.11964800357818603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,32,1,power_law_1.2,0.11972479820251465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,4,1,balanced,0.35974399248758954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,4,1,balanced,0.3635573387145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,4,1,power_law_1.01,0.3915519952774048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,4,1,power_law_1.01,0.39628798961639405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,4,1,power_law_1.2,0.3926527976989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,4,1,power_law_1.2,0.39407360553741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,8,1,balanced,0.2214613358179728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,8,1,balanced,0.22234666347503662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,8,1,power_law_1.01,0.24676480293273925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,8,1,power_law_1.01,0.24715518951416016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,8,1,power_law_1.2,0.24216320514678955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,16384,2,8,8,1,power_law_1.2,0.24498560428619384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,1,balanced,2.0560800234476724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,1,balanced,2.0803200403849282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,1,power_law_1.01,2.054681587219238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,1,power_law_1.01,2.0619583129882812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,1,power_law_1.2,2.178598403930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,1,power_law_1.2,2.216320037841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,128,balanced,0.3278506596883138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,128,balanced,0.3304640054702759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,128,power_law_1.01,0.3384063959121704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,128,power_law_1.01,0.34250240325927733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,128,power_law_1.2,0.3475647926330566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,128,power_law_1.2,0.34822399616241456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,16,balanced,0.42981334527333576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,16,balanced,0.4306666851043701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,16,power_law_1.01,0.4501952171325684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,16,power_law_1.01,0.45274882316589354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,16,power_law_1.2,0.46122241020202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,16,power_law_1.2,0.46613759994506837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,2,balanced,1.1791626612345378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,2,balanced,1.191327969233195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,2,power_law_1.01,1.2179264068603515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,2,power_law_1.01,1.2411392211914063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,2,power_law_1.2,1.2926143646240233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,2,power_law_1.2,1.3089216232299805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,256,balanced,0.3233120044072469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,256,balanced,0.32449066638946533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,256,power_law_1.01,0.33178880214691164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,256,power_law_1.01,0.33235199451446534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,256,power_law_1.2,0.34143359661102296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,256,power_law_1.2,0.34254720211029055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,32,balanced,0.3712746699651082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,32,balanced,0.3720639944076538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,32,power_law_1.01,0.3885951995849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,32,power_law_1.01,0.39210240840911864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,32,power_law_1.2,0.39738240242004397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,32,power_law_1.2,0.398636794090271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,4,balanced,0.7580320040384928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,4,balanced,0.7614826361338297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,4,power_law_1.01,0.7833151817321777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,4,power_law_1.01,0.7899712085723877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,4,power_law_1.2,0.8174400329589844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,4,power_law_1.2,0.820076847076416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,64,balanced,0.3406613270441691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,64,balanced,0.34115731716156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,64,power_law_1.01,0.3553215980529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,64,power_law_1.01,0.3571775913238525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,64,power_law_1.2,0.36632959842681884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,64,power_law_1.2,0.37183361053466796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,8,balanced,0.5375306606292725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,8,balanced,0.5412533283233643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,8,power_law_1.01,0.5628096103668213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,8,power_law_1.01,0.5631103992462159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,8,power_law_1.2,0.5792064189910888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,1,8,power_law_1.2,0.5846399784088134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,16,1,balanced,0.4038506746292114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,16,1,balanced,0.4057653347651164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,16,1,power_law_1.01,0.41785597801208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,16,1,power_law_1.01,0.4189760208129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,16,1,power_law_1.2,0.4496448040008545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,16,1,power_law_1.2,0.4534912109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,2,1,balanced,1.121888001759847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,2,1,balanced,1.1220959822336833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,2,1,power_law_1.01,1.1559295654296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,2,1,power_law_1.01,1.1731391906738282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,2,1,power_law_1.2,1.2087615966796874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,2,1,power_law_1.2,1.221951961517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,32,1,balanced,0.36286401748657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,32,1,balanced,0.36370666821797687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,32,1,power_law_1.01,0.37384960651397703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,32,1,power_law_1.01,0.37832961082458494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,32,1,power_law_1.2,0.39760000705718995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,32,1,power_law_1.2,0.4111743927001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,4,1,balanced,0.6994667053222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,4,1,balanced,0.7005173365275065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,4,1,power_law_1.01,0.7303743839263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,4,1,power_law_1.01,0.7318975925445557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,4,1,power_law_1.2,0.7571072101593017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,4,1,power_law_1.2,0.7655935764312745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,8,1,balanced,0.5092159907023112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,8,1,balanced,0.5100746552149454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,8,1,power_law_1.01,0.5222720146179199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,8,1,power_law_1.01,0.5243391990661621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,8,1,power_law_1.2,0.5388544082641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2048,8,256,8,1,power_law_1.2,0.5561535835266114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,1,balanced,1.6518826484680176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,1,balanced,1.7045386632283528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,1,power_law_1.01,1.850227165222168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,1,power_law_1.01,1.8841983795166015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,1,power_law_1.2,1.9323968887329102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,1,power_law_1.2,1.959552001953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,16,balanced,0.3876906633377075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,16,balanced,0.38782934347788495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,16,power_law_1.01,0.4296127796173096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,16,power_law_1.01,0.43123841285705566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,16,power_law_1.2,0.4474944114685059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,16,power_law_1.2,0.4578432083129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,2,balanced,0.9829066594441732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,2,balanced,0.9852960109710693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,2,power_law_1.01,1.1246784210205079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,2,power_law_1.01,1.1323583602905274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,2,power_law_1.2,1.1394816398620606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,2,power_law_1.2,1.1809280395507813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,32,balanced,0.34142398834228516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,32,balanced,0.3426986535390218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,32,power_law_1.01,0.37179520130157473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,32,power_law_1.01,0.38537600040435793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,32,power_law_1.2,0.385913610458374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,32,power_law_1.2,0.3940927982330322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,4,balanced,0.6459093491236368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,4,balanced,0.6484213272730509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,4,power_law_1.01,0.721062421798706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,4,power_law_1.01,0.7315648078918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,4,power_law_1.2,0.7625664234161377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,4,power_law_1.2,0.764518404006958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,8,balanced,0.4766293366750081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,8,balanced,0.4789919853210449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,8,power_law_1.01,0.5379519939422608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,8,power_law_1.01,0.5396863937377929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,8,power_law_1.2,0.5535935878753662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,1,8,power_law_1.2,0.5583231925964356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,16,1,balanced,0.34695998827616376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,16,1,balanced,0.34721068541208905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,16,1,power_law_1.01,0.40027518272399903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,16,1,power_law_1.01,0.4005568027496338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,16,1,power_law_1.2,0.40351362228393556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,16,1,power_law_1.2,0.406828784942627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,2,1,balanced,0.9185173511505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,2,1,balanced,0.9226720333099365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,2,1,power_law_1.01,1.0529536247253417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,2,1,power_law_1.01,1.0601792335510254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,2,1,power_law_1.2,1.0757696151733398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,2,1,power_law_1.2,1.0837568283081054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,32,1,balanced,0.31710400183995563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,32,1,balanced,0.31858134269714355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,32,1,power_law_1.01,0.3477567911148071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,32,1,power_law_1.01,0.34858880043029783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,32,1,power_law_1.2,0.35180160999298093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,32,1,power_law_1.2,0.35204479694366453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,4,1,balanced,0.5820266803105673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,4,1,balanced,0.5825920104980469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,4,1,power_law_1.01,0.6628479957580566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,4,1,power_law_1.01,0.6644864082336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,4,1,power_law_1.2,0.6746496200561524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,4,1,power_law_1.2,0.67642240524292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,8,1,balanced,0.41201599438985187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,8,1,balanced,0.41272000471750897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,8,1,power_law_1.01,0.46737279891967776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,8,1,power_law_1.01,0.4689216136932373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,8,1,power_law_1.2,0.47031679153442385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,6144,2560,8,160,8,1,power_law_1.2,0.47295360565185546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,1,balanced,2.3631359736124673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,1,balanced,2.3981706301371255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,1,power_law_1.01,2.4077312469482424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,1,power_law_1.01,2.426310348510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,1,power_law_1.2,2.5030527114868164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,1,power_law_1.2,2.5867647171020507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,128,balanced,0.35895999272664386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,128,balanced,0.3590773344039917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,128,power_law_1.01,0.37309439182281495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,128,power_law_1.01,0.37525119781494143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,128,power_law_1.2,0.38213119506835935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,128,power_law_1.2,0.3852672100067139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,16,balanced,0.47678931554158527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,16,balanced,0.47778133551279706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,16,power_law_1.01,0.4999231815338135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,16,power_law_1.01,0.5063615798950195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,16,power_law_1.2,0.511359977722168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,16,power_law_1.2,0.5237120151519775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,2,balanced,1.3666186332702637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,2,balanced,1.38373867670695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,2,power_law_1.01,1.3857600212097168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,2,power_law_1.01,1.3988287925720215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,2,power_law_1.2,1.4707008361816407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,2,power_law_1.2,1.477849578857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,256,balanced,0.3531573216120402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,256,balanced,0.3550560077031453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,256,power_law_1.01,0.3616640090942383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,256,power_law_1.01,0.3645375967025757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,256,power_law_1.2,0.3732480049133301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,256,power_law_1.2,0.37525119781494143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,32,balanced,0.4064799944559733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,32,balanced,0.4068959951400757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,32,power_law_1.01,0.42254080772399905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,32,power_law_1.01,0.43277440071105955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,32,power_law_1.2,0.44196481704711915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,32,power_law_1.2,0.44433279037475587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,4,balanced,0.8559093475341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,4,balanced,0.8577173550923666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,4,power_law_1.01,0.8871232032775879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,4,power_law_1.01,0.8897855758666993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,4,power_law_1.2,0.9221440315246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,4,power_law_1.2,0.9423359870910645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,64,balanced,0.37139733632405597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,64,balanced,0.3731253147125244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,64,power_law_1.01,0.39204480648040774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,64,power_law_1.01,0.39223039150238037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,64,power_law_1.2,0.3998847961425781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,64,power_law_1.2,0.40372481346130373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,8,balanced,0.6040159861246744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,8,balanced,0.6051413218180338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,8,power_law_1.01,0.6317887783050538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,8,power_law_1.01,0.633081579208374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,8,power_law_1.2,0.6407616138458252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,1,8,power_law_1.2,0.6569791793823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,16,1,balanced,0.4617226521174113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,16,1,balanced,0.4628266493479411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,16,1,power_law_1.01,0.47895040512084963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,16,1,power_law_1.01,0.4814784049987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,16,1,power_law_1.2,0.5123072147369385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,16,1,power_law_1.2,0.5156415939331055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,2,1,balanced,1.2881706555684407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,2,1,balanced,1.301584005355835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,2,1,power_law_1.01,1.3389056205749512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,2,1,power_law_1.01,1.3502079963684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,2,1,power_law_1.2,1.3971967697143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,2,1,power_law_1.2,1.4048447608947754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,32,1,balanced,0.41306666533152264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,32,1,balanced,0.41360533237457275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,32,1,power_law_1.01,0.4332287788391113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,32,1,power_law_1.01,0.43422718048095704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,32,1,power_law_1.2,0.4685311794281006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,32,1,power_law_1.2,0.46906242370605467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,4,1,balanced,0.8035199642181396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,4,1,balanced,0.8035679658253988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,4,1,power_law_1.01,0.8368767738342285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,4,1,power_law_1.01,0.8410431861877441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,4,1,power_law_1.2,0.8813759803771972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,4,1,power_law_1.2,0.8844736099243165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,8,1,balanced,0.5860373179117838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,8,1,balanced,0.5867626667022705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,8,1,power_law_1.01,0.6007999897003173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,8,1,power_law_1.01,0.605676794052124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,8,1,power_law_1.2,0.6191423892974853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,256,8,1,power_law_1.2,0.6413119792938232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,1,balanced,3.610117276509603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,1,balanced,3.6388107935587564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,1,power_law_1.01,3.255052947998047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,1,power_law_1.01,3.2991424560546876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,1,power_law_1.2,3.3114944458007813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,1,power_law_1.2,3.4921470642089845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,128,balanced,0.42293866475423175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,128,balanced,0.423311988512675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,128,power_law_1.01,0.43283839225769044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,128,power_law_1.01,0.4330751895904541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,128,power_law_1.2,0.4408576011657715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,128,power_law_1.2,0.44190077781677245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,16,balanced,0.5950293143590292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,16,balanced,0.5961546500523885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,16,power_law_1.01,0.5813183784484863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,16,power_law_1.01,0.5998015880584717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,16,power_law_1.2,0.6114240169525147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,16,power_law_1.2,0.6159615993499756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,2,balanced,1.8923412958780925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,2,balanced,1.9297919273376465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,2,power_law_1.01,1.795955276489258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,2,power_law_1.01,1.806528091430664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,2,power_law_1.2,1.885273551940918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,2,power_law_1.2,1.8945152282714843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,32,balanced,0.5025120178858439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,32,balanced,0.5025333166122437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,32,power_law_1.01,0.5094336032867431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,32,power_law_1.01,0.5119232177734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,32,power_law_1.2,0.5203519821166992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,32,power_law_1.2,0.5246975898742676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,4,balanced,1.1541546980539958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,4,balanced,1.155834674835205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,4,power_law_1.01,1.0810560226440429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,4,power_law_1.01,1.1116671562194824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,4,power_law_1.2,1.1452287673950194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,4,power_law_1.2,1.1511679649353028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,64,balanced,0.44650665918986004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,64,balanced,0.44707198937733966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,64,power_law_1.01,0.4618175983428955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,64,power_law_1.01,0.4634751796722412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,64,power_law_1.2,0.4671679973602295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,64,power_law_1.2,0.4683072090148926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,8,balanced,0.7890453338623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,8,balanced,0.7890666325887045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,8,power_law_1.01,0.7688640117645263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,8,power_law_1.01,0.7784768104553222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,8,power_law_1.2,0.7883456230163575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,1,8,power_law_1.2,0.7998528003692627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,16,1,balanced,0.6254186630249023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,16,1,balanced,0.6268106698989868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,16,1,power_law_1.01,0.6076416015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,16,1,power_law_1.01,0.6093503952026367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,16,1,power_law_1.2,0.6255231857299804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,16,1,power_law_1.2,0.631283187866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,2,1,balanced,1.8869867324829102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,2,1,balanced,1.950112024943034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,2,1,power_law_1.01,1.7263616561889648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,2,1,power_law_1.01,1.7331199645996094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,2,1,power_law_1.2,1.8040512084960938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,2,1,power_law_1.2,1.831270408630371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,32,1,balanced,0.5679146846135458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,32,1,balanced,0.5688693523406982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,32,1,power_law_1.01,0.5507391929626465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,32,1,power_law_1.01,0.5539648056030273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,32,1,power_law_1.2,0.5622079849243165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,32,1,power_law_1.2,0.5666495800018311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,4,1,balanced,1.1342720190684001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,4,1,balanced,1.1384373505910237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,4,1,power_law_1.01,1.0752063751220704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,4,1,power_law_1.01,1.08023042678833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,4,1,power_law_1.2,1.0991168022155762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,4,1,power_law_1.2,1.1204799652099608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,8,1,balanced,0.8024106820424398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,8,1,balanced,0.8026879628499349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,8,1,power_law_1.01,0.7444608211517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,8,1,power_law_1.01,0.7806528091430665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,8,1,power_law_1.2,0.7846528053283691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,1536,7168,2048,8,384,8,1,power_law_1.2,0.7926527976989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,1,balanced,0.13147733608881632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,1,balanced,0.13157866398493448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,1,power_law_1.01,0.08321279883384705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,1,power_law_1.01,0.08423039913177491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,1,power_law_1.2,0.08090879917144775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,1,power_law_1.2,0.08107519745826722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,128,balanced,0.027642667293548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,128,balanced,0.02942399928967158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,128,power_law_1.01,0.027020800113677978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,128,power_law_1.01,0.028089600801467895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,128,power_law_1.2,0.026739200949668883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,128,power_law_1.2,0.02736000120639801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,16,balanced,0.033200000723203026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,16,balanced,0.03359466542800268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,16,power_law_1.01,0.029977598786354066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,16,power_law_1.01,0.030604800581932066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,16,power_law_1.2,0.0302592009305954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,16,power_law_1.2,0.03118079900741577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,2,balanced,0.0867039958635966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,2,balanced,0.08683733145395915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,2,power_law_1.01,0.058976000547409056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,2,power_law_1.01,0.06056320071220398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,2,power_law_1.2,0.055852800607681274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,2,power_law_1.2,0.059520000219345094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,32,balanced,0.031498665610949196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,32,balanced,0.03166399896144867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,32,power_law_1.01,0.027859199047088622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,32,power_law_1.01,0.028652799129486085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,32,power_law_1.2,0.028883200883865357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,32,power_law_1.2,0.02917119860649109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,4,balanced,0.058464000622431435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,4,balanced,0.0588266650835673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,4,power_law_1.01,0.04666880071163178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,4,power_law_1.01,0.04687359929084778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,4,power_law_1.2,0.04297600090503693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,4,power_law_1.2,0.045561599731445315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,64,balanced,0.029205332199732464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,64,balanced,0.029477333029111225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,64,power_law_1.01,0.027724799513816834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,64,power_law_1.01,0.027910399436950683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,64,power_law_1.2,0.02778240144252777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,64,power_law_1.2,0.028166401386260986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,8,balanced,0.03942399968703588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,8,balanced,0.041834667325019836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,8,power_law_1.01,0.03427839875221252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,8,power_law_1.01,0.03596799969673157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,8,power_law_1.2,0.033055999875068666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,1,8,power_law_1.2,0.036735999584198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,2,1,balanced,0.086709330479304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,2,1,balanced,0.08782399694124858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,2,1,power_law_1.01,0.05612159967422485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,2,1,power_law_1.01,0.056569600105285646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,2,1,power_law_1.2,0.05308160185813904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,2,1,power_law_1.2,0.05330560207366943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,4,1,balanced,0.061253334085146584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,4,1,balanced,0.06259199976921082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,4,1,power_law_1.01,0.042342400550842284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,4,1,power_law_1.01,0.043731200695037845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,4,1,power_law_1.2,0.039680001139640805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2048,768,8,128,4,1,power_law_1.2,0.03989759981632233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,1,balanced,0.2509866754213969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,1,balanced,0.25228265921274823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,1,power_law_1.01,0.17244800329208373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,1,power_law_1.01,0.17274880409240723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,1,power_law_1.2,0.1568063974380493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,1,power_law_1.2,0.1578495979309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,128,balanced,0.0327360009153684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,128,balanced,0.03332799921433131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,128,power_law_1.01,0.031488001346588135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,128,power_law_1.01,0.031513598561286923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,128,power_law_1.2,0.03139840066432953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,128,power_law_1.2,0.031974399089813234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,16,balanced,0.04451733330885569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,16,balanced,0.045882667104403176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,16,power_law_1.01,0.045849600434303285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,16,power_law_1.01,0.046803200244903566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,16,power_law_1.2,0.04136959910392761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,16,power_law_1.2,0.04714879989624023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,2,balanced,0.147407998641332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,2,balanced,0.14788267016410828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,2,power_law_1.01,0.11195520162582398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,2,power_law_1.01,0.11294080018997192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,2,power_law_1.2,0.10708479881286621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,2,power_law_1.2,0.10758399963378906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,32,balanced,0.037402667105197906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,32,balanced,0.03757333258787791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,32,power_law_1.01,0.036108800768852235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,32,power_law_1.01,0.0364544004201889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,32,power_law_1.2,0.035148799419403076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,32,power_law_1.2,0.03635840117931366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,4,balanced,0.09802132844924927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,4,balanced,0.10009066263834636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,4,power_law_1.01,0.08755840063095092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,4,power_law_1.01,0.08900480270385742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,4,power_law_1.2,0.08344320058822632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,4,power_law_1.2,0.08387839794158936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,64,balanced,0.03558400024970373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,64,balanced,0.03565333286921183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,64,power_law_1.01,0.03359360098838806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,64,power_law_1.01,0.034195199608802795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,64,power_law_1.2,0.03333120048046112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,64,power_law_1.2,0.03395200073719025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,8,balanced,0.06442133088906606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,8,balanced,0.06494933366775513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,8,power_law_1.01,0.060198402404785155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,8,power_law_1.01,0.06410239934921265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,8,power_law_1.2,0.061388802528381345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,1,8,power_law_1.2,0.07120640277862549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,16,1,balanced,0.16061866283416748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,16,1,balanced,0.1606666644414266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,16,1,power_law_1.01,0.1090880036354065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,16,1,power_law_1.01,0.11188479661941528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,16,1,power_law_1.2,0.09713280200958252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,16,1,power_law_1.2,0.10133119821548461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,2,1,balanced,0.14684266845385233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,2,1,balanced,0.14696533481280008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,2,1,power_law_1.01,0.10401279926300049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,2,1,power_law_1.01,0.10442880392074586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,2,1,power_law_1.2,0.0995136022567749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,2,1,power_law_1.2,0.1003775954246521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,32,1,balanced,0.14922133088111877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,32,1,balanced,0.1504533290863037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,32,1,power_law_1.01,0.09940479993820191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,32,1,power_law_1.01,0.10166399478912354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,32,1,power_law_1.2,0.08899840116500854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,32,1,power_law_1.2,0.09485440254211426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,4,1,balanced,0.10078400373458862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,4,1,balanced,0.10121066371599834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,4,1,power_law_1.01,0.0705024003982544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,4,1,power_law_1.01,0.0720192015171051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,4,1,power_law_1.2,0.06727039813995361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,4,1,power_law_1.2,0.06741120219230652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,8,1,balanced,0.19763733943303427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,8,1,balanced,0.19808000326156616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,8,1,power_law_1.01,0.1299008011817932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,8,1,power_law_1.01,0.13292160034179687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,8,1,power_law_1.2,0.12052479982376099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,2688,1856,6,128,8,1,power_law_1.2,0.12171519994735717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,1,balanced,0.3105226755142212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,1,balanced,0.3525173266728719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,1,power_law_1.01,0.24298880100250245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,1,power_law_1.01,0.24410240650177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,1,power_law_1.2,0.2157439947128296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,1,power_law_1.2,0.2239680051803589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,128,balanced,0.033333333830038704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,128,balanced,0.03349333256483078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,128,power_law_1.01,0.03187839984893799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,128,power_law_1.01,0.03201920092105866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,128,power_law_1.2,0.03224959969520569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,128,power_law_1.2,0.03244799971580505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,16,balanced,0.05358933409055074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,16,balanced,0.053904001911481224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,16,power_law_1.01,0.06761599779129028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,16,power_law_1.01,0.07149440050125122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,16,power_law_1.2,0.07039999961853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,16,power_law_1.2,0.07109119892120361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,2,balanced,0.1821333368619283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,2,balanced,0.18308266003926596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,2,power_law_1.01,0.15987199544906616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,2,power_law_1.01,0.16361600160598755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,2,power_law_1.2,0.14536319971084594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,2,power_law_1.2,0.1476096034049988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,256,balanced,0.03156800071398417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,256,balanced,0.031583999594052635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,256,power_law_1.01,0.031763198971748355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,256,power_law_1.01,0.0319680005311966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,256,power_law_1.2,0.031148800253868104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,256,power_law_1.2,0.03162879943847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,32,balanced,0.03759466608365377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,32,balanced,0.03888533264398575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,32,power_law_1.01,0.049030399322509764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,32,power_law_1.01,0.05175039768218994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,32,power_law_1.2,0.04531840085983276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,32,power_law_1.2,0.05076479911804199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,4,balanced,0.11242133378982544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,4,balanced,0.11329600214958191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,4,power_law_1.01,0.10371840000152588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,4,power_law_1.01,0.1134719967842102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,4,power_law_1.2,0.11269760131835938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,4,power_law_1.2,0.11847039461135864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,64,balanced,0.03332266708215078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,64,balanced,0.03344533344109853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,64,power_law_1.01,0.036339199542999266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,64,power_law_1.01,0.03697920143604279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,64,power_law_1.2,0.03560320138931274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,64,power_law_1.2,0.036236798763275145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,8,balanced,0.0726986676454544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,8,balanced,0.07278400162855785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,8,power_law_1.01,0.09463679790496826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,8,power_law_1.01,0.10123519897460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,8,power_law_1.2,0.09257599711418152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,1,8,power_law_1.2,0.0948736011981964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,16,1,balanced,0.05809600154558817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,16,1,balanced,0.06018666426340739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,16,1,power_law_1.01,0.05120000243186951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,16,1,power_law_1.01,0.05237119793891907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,16,1,power_law_1.2,0.04793600142002106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,16,1,power_law_1.2,0.048416000604629514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,2,1,balanced,0.17727466424306235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,2,1,balanced,0.17827733357747397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,2,1,power_law_1.01,0.14061440229415895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,2,1,power_law_1.01,0.14318079948425294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,2,1,power_law_1.2,0.13026560544967652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,2,1,power_law_1.2,0.13403520584106446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,32,1,balanced,0.04987200101216634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,32,1,balanced,0.049914668003718056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,32,1,power_law_1.01,0.04565120041370392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,32,1,power_law_1.01,0.046348801255226134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,32,1,power_law_1.2,0.04302079975605011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,32,1,power_law_1.2,0.04505600035190582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,4,1,balanced,0.11345066626866658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,4,1,balanced,0.11469866832097371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,4,1,power_law_1.01,0.09697920083999634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,4,1,power_law_1.01,0.09754239916801452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,4,1,power_law_1.2,0.08418560028076172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,4,1,power_law_1.2,0.08937600255012512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,8,1,balanced,0.08084799846013387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,8,1,balanced,0.08222400148709615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,8,1,power_law_1.01,0.06509439945220948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,8,1,power_law_1.01,0.066975998878479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,8,1,power_law_1.2,0.06333439946174621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,3072,1536,8,256,8,1,power_law_1.2,0.06345599889755249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,1,balanced,0.2550506591796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,1,balanced,0.25685866673787433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,1,power_law_1.01,0.24734079837799072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,1,power_law_1.01,0.25238399505615233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,1,power_law_1.2,0.2512255907058716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,1,power_law_1.2,0.25626239776611326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,2,balanced,0.17010132471720377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,2,balanced,0.17525867621103922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,2,power_law_1.01,0.1604864001274109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,2,power_law_1.01,0.16179200410842895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,2,power_law_1.2,0.16044800281524657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,2,power_law_1.2,0.17043839693069457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,4,balanced,0.11398399869600932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,4,balanced,0.11515200138092041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,4,power_law_1.01,0.11143039464950562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,4,power_law_1.01,0.11278079748153687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,4,power_law_1.2,0.11172480583190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,4,power_law_1.2,0.11370240449905396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,8,balanced,0.0888853371143341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,8,balanced,0.09455466270446777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,8,power_law_1.01,0.08600959777832032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,8,power_law_1.01,0.08684160113334656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,8,power_law_1.2,0.08634240031242371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,1,8,power_law_1.2,0.08718079924583436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,16,1,balanced,0.03579733272393545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,16,1,balanced,0.036943999429543815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,16,1,power_law_1.01,0.03408640027046204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,16,1,power_law_1.01,0.03633280098438263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,16,1,power_law_1.2,0.03522560000419617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,16,1,power_law_1.2,0.035411199927330016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,2,1,balanced,0.14874133467674255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,2,1,balanced,0.15818132956822714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,2,1,power_law_1.01,0.13844480514526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,2,1,power_law_1.01,0.14130560159683228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,2,1,power_law_1.2,0.1394495964050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,2,1,power_law_1.2,0.13979519605636598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,32,1,balanced,0.031167998909950256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,32,1,balanced,0.031194667021433514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,32,1,power_law_1.01,0.02865920066833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,32,1,power_law_1.01,0.029068800806999206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,32,1,power_law_1.2,0.02873600125312805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,32,1,power_law_1.2,0.02879360020160675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,4,1,balanced,0.08418132861455281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,4,1,balanced,0.0846613347530365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,4,1,power_law_1.01,0.08229119777679443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,4,1,power_law_1.01,0.08243839740753174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,4,1,power_law_1.2,0.08216320276260376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,4,1,power_law_1.2,0.0836736023426056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,8,1,balanced,0.05730666716893514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,8,1,balanced,0.05933333436648051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,8,1,power_law_1.01,0.05319039821624756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,8,1,power_law_1.01,0.053414398431777955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,8,1,power_law_1.2,0.05321599841117859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,14336,2,8,8,1,power_law_1.2,0.05475199818611145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,1,balanced,0.3975786765416463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,1,balanced,0.3976000150044759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,1,power_law_1.01,0.2199104070663452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,1,power_law_1.01,0.2233344078063965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,1,power_law_1.2,0.20396800041198732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,1,power_law_1.2,0.2092288017272949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,128,balanced,0.03379199902216593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,128,balanced,0.035445332527160645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,128,power_law_1.01,0.03371520042419433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,128,power_law_1.01,0.03418880105018616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,128,power_law_1.2,0.03342080116271973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,128,power_law_1.2,0.03399679958820343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,16,balanced,0.06018666426340739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,16,balanced,0.06062399844328562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,16,power_law_1.01,0.04737280011177063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,16,power_law_1.01,0.055795198678970336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,16,power_law_1.2,0.049516800045967105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,16,power_law_1.2,0.05252479910850525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,2,balanced,0.22574400901794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,2,balanced,0.22587200005849203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,2,power_law_1.01,0.13781119585037233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,2,power_law_1.01,0.14049279689788818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,2,power_law_1.2,0.1399168014526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,2,power_law_1.2,0.15000319480895996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,32,balanced,0.041482667128245033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,32,balanced,0.04389866689840952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,32,power_law_1.01,0.03935360014438629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,32,power_law_1.01,0.039647999405860904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,32,power_law_1.2,0.03816959857940674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,32,power_law_1.2,0.04073599874973297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,4,balanced,0.13798933227856955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,4,balanced,0.13809600472450256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,4,power_law_1.01,0.0834559977054596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,4,power_law_1.01,0.09669119715690613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,4,power_law_1.2,0.08679680228233337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,4,power_law_1.2,0.1051967978477478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,64,balanced,0.03661333272854487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,64,balanced,0.0373279998699824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,64,power_law_1.01,0.03531520068645477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,64,power_law_1.01,0.03559040129184723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,64,power_law_1.2,0.03492479920387268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,64,power_law_1.2,0.035180801153182985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,8,balanced,0.0835040012995402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,8,balanced,0.08460799853006999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,8,power_law_1.01,0.06350719928741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,8,power_law_1.01,0.07071359753608704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,8,power_law_1.2,0.06778240203857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,1,8,power_law_1.2,0.07073280215263367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,16,1,balanced,0.072202667593956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,16,1,balanced,0.07233066856861115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,16,1,power_law_1.01,0.04948480129241943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,16,1,power_law_1.01,0.050310397148132326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,16,1,power_law_1.2,0.048102399706840514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,16,1,power_law_1.2,0.04845440089702606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,2,1,balanced,0.22392000754674277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,2,1,balanced,0.2280693252881368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,2,1,power_law_1.01,0.13326719999313355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,2,1,power_law_1.01,0.1351807951927185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,2,1,power_law_1.2,0.12942080497741698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,2,1,power_law_1.2,0.12951040267944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,32,1,balanced,0.05816000203291575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,32,1,balanced,0.060122668743133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,32,1,power_law_1.01,0.043321600556373595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,32,1,power_law_1.01,0.04438399970531463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,32,1,power_law_1.2,0.04179840087890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,32,1,power_law_1.2,0.0438975989818573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,4,1,balanced,0.14274666706720987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,4,1,balanced,0.14285866419474283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,4,1,power_law_1.01,0.08261759877204895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,4,1,power_law_1.01,0.08407040238380432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,4,1,power_law_1.2,0.07826560139656066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,4,1,power_law_1.2,0.07947520017623902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,8,1,balanced,0.09628267089525859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,8,1,balanced,0.0965119997660319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,8,1,power_law_1.01,0.06471040248870849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,8,1,power_law_1.01,0.06499199867248535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,8,1,power_law_1.2,0.06050559878349304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,1536,8,128,8,1,power_law_1.2,0.060844802856445314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,1,balanced,1.7690720558166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,1,balanced,1.770271937052409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,1,power_law_1.01,1.1562815666198731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,1,power_law_1.01,1.157254409790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,1,power_law_1.2,1.0289728164672851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,1,power_law_1.2,1.066707229614258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,128,balanced,0.07026133437951405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,128,balanced,0.07055466870466869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,128,power_law_1.01,0.06458879709243774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,128,power_law_1.01,0.06503679752349853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,128,power_law_1.2,0.06338559985160827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,128,power_law_1.2,0.06504960060119629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,16,balanced,0.19088532527287802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,16,balanced,0.19248000780741373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,16,power_law_1.01,0.2124095916748047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,16,power_law_1.01,0.21380479335784913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,16,power_law_1.2,0.2119999885559082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,16,power_law_1.2,0.21242880821228027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,2,balanced,0.9228906631469727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,2,balanced,0.9242346286773682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,2,power_law_1.01,0.6588031768798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,2,power_law_1.01,0.6945727825164795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,2,power_law_1.2,0.61112961769104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,2,power_law_1.2,0.6598144054412842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,256,balanced,0.05792533357938131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,256,balanced,0.05823466678460439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,256,power_law_1.01,0.05621119737625122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,256,power_law_1.01,0.05623040199279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,256,power_law_1.2,0.05594239830970764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,256,power_law_1.2,0.05605760216712952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,32,balanced,0.14476799964904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,32,balanced,0.14521066347757974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,32,power_law_1.01,0.14257279634475709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,32,power_law_1.01,0.1428928017616272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,32,power_law_1.2,0.13178240060806273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,32,power_law_1.2,0.13271039724349976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,4,balanced,0.5021173159281412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,4,balanced,0.5027946631113688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,4,power_law_1.01,0.44805121421813965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,4,power_law_1.01,0.4499328136444092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,4,power_law_1.2,0.4104640007019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,4,power_law_1.2,0.4609983921051025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,64,balanced,0.09071466326713562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,64,balanced,0.09086933732032776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,64,power_law_1.01,0.08579840064048767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,64,power_law_1.01,0.0861631989479065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,64,power_law_1.2,0.07772799730300903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,64,power_law_1.2,0.08216320276260376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,8,balanced,0.29389333724975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,8,balanced,0.2955999970436096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,8,power_law_1.01,0.3358400106430054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,8,power_law_1.01,0.3358527898788452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,8,power_law_1.2,0.334335994720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,1,8,power_law_1.2,0.33696000576019286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,16,1,balanced,0.9246293703715006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,16,1,balanced,0.9259413083394369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,16,1,power_law_1.01,0.6047232151031494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,16,1,power_law_1.01,0.6178431987762452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,16,1,power_law_1.2,0.5568575859069824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,16,1,power_law_1.2,0.5609471797943115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,2,1,balanced,0.8998880386352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,2,1,balanced,0.9034720261891683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,2,1,power_law_1.01,0.601804780960083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,2,1,power_law_1.01,0.6117311954498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,2,1,power_law_1.2,0.5386752128601074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,2,1,power_law_1.2,0.5495488166809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,32,1,balanced,0.776629368464152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,32,1,balanced,0.7796853383382162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,32,1,power_law_1.01,0.5152959823608398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,32,1,power_law_1.01,0.5158336162567139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,32,1,power_law_1.2,0.46129918098449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,32,1,power_law_1.2,0.47670397758483884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,4,1,balanced,0.499232014020284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,4,1,balanced,0.5015413363774618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,4,1,power_law_1.01,0.33966081142425536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,4,1,power_law_1.01,0.3398144006729126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,4,1,power_law_1.2,0.31201920509338377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,4,1,power_law_1.2,0.31221120357513427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,8,1,balanced,0.2995199958483378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,8,1,balanced,0.32309865951538086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,8,1,power_law_1.01,0.21377279758453369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,8,1,power_law_1.01,0.21466240882873536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,8,1,power_law_1.2,0.19615360498428344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,4096,2688,22,512,8,1,power_law_1.2,0.19892480373382568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,1,balanced,0.4330559968948364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,1,balanced,0.43446401755015057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,1,power_law_1.01,0.42851839065551756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,1,power_law_1.01,0.4308608055114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,1,power_law_1.2,0.42819838523864745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,1,power_law_1.2,0.4330304145812988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,2,balanced,0.24571200211842856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,2,balanced,0.2718240022659302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,2,power_law_1.01,0.24859519004821778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,2,power_law_1.01,0.2491136074066162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,2,power_law_1.2,0.23029758930206298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,2,power_law_1.2,0.24925439357757567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,4,balanced,0.167087992032369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,4,balanced,0.16857065757115683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,4,power_law_1.01,0.15588480234146118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,4,power_law_1.01,0.15808000564575195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,4,power_law_1.2,0.15762560367584227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,4,power_law_1.2,0.15953279733657838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,8,balanced,0.11177066961924235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,8,balanced,0.1165066659450531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,8,power_law_1.01,0.11214720010757447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,8,power_law_1.01,0.11239039897918701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,8,power_law_1.2,0.11262719631195069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,1,8,power_law_1.2,0.11266560554504394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,16,1,balanced,0.05741333464781443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,16,1,balanced,0.060085331400235496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,16,1,power_law_1.01,0.053337597846984865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,16,1,power_law_1.01,0.05373439788818359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,16,1,power_law_1.2,0.052825599908828735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,16,1,power_law_1.2,0.053862398862838744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,2,1,balanced,0.23029865821202597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,2,1,balanced,0.24047466119130453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,2,1,power_law_1.01,0.2233407974243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,2,1,power_law_1.01,0.2282111883163452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,2,1,power_law_1.2,0.21520640850067138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,2,1,power_law_1.2,0.22071681022644044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,32,1,balanced,0.03566933423280716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,32,1,balanced,0.03586133321126302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,32,1,power_law_1.01,0.03544960021972656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,32,1,power_law_1.01,0.03641600012779236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,32,1,power_law_1.2,0.03457280099391937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,32,1,power_law_1.2,0.03687680065631867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,4,1,balanced,0.13338667154312134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,4,1,balanced,0.1464853286743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,4,1,power_law_1.01,0.12685439586639405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,4,1,power_law_1.01,0.12829439640045165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,4,1,power_law_1.2,0.12949119806289672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,4,1,power_law_1.2,0.14369920492172242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,8,1,balanced,0.08507733543713887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,8,1,balanced,0.0897866686185201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,8,1,power_law_1.01,0.07500159740447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,8,1,power_law_1.01,0.0754368007183075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,8,1,power_law_1.2,0.07574399709701538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,16384,2,8,8,1,power_law_1.2,0.07591040134429931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,1,balanced,0.7870133717854818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,1,balanced,0.7943413257598877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,1,power_law_1.01,0.5753600120544433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,1,power_law_1.01,0.6080512046813965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,1,power_law_1.2,0.5457727909088135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,1,power_law_1.2,0.5483456134796143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,128,balanced,0.04072533299525579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,128,balanced,0.04162666698296865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,128,power_law_1.01,0.045158401131629944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,128,power_law_1.01,0.04723840057849884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,128,power_law_1.2,0.04661760032176972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,128,power_law_1.2,0.04678399860858917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,16,balanced,0.08611200253168742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,16,balanced,0.08717333277066548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,16,power_law_1.01,0.13966720104217528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,16,power_law_1.01,0.1398848056793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,16,power_law_1.2,0.1326591968536377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,16,power_law_1.2,0.13813120126724243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,2,balanced,0.41789865493774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,2,balanced,0.42347200711568195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,2,power_law_1.01,0.37389440536499025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,2,power_law_1.01,0.38161280155181887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,2,power_law_1.2,0.3420095920562744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,2,power_law_1.2,0.3461375951766968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,256,balanced,0.03984533250331879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,256,balanced,0.04037333279848099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,256,power_law_1.01,0.039027199149131775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,256,power_law_1.01,0.03940480053424835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,256,power_law_1.2,0.039743998646736146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,256,power_law_1.2,0.03983359932899475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,32,balanced,0.06419200201829274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,32,balanced,0.06650133430957794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,32,power_law_1.01,0.07688959836959838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,32,power_law_1.01,0.08005759716033936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,32,power_law_1.2,0.07155839800834655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,32,power_law_1.2,0.07948160171508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,4,balanced,0.23622934023539224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,4,balanced,0.24043200413386026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,4,power_law_1.01,0.23542399406433107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,4,power_law_1.01,0.2542975902557373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,4,power_law_1.2,0.24368000030517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,4,power_law_1.2,0.2611840009689331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,64,balanced,0.049653331438700356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,64,balanced,0.04987733562787374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,64,power_law_1.01,0.06109439730644226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,64,power_law_1.01,0.0631168007850647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,64,power_law_1.2,0.05845119953155518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,64,power_law_1.2,0.06318079829216003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,8,balanced,0.14135467012723288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,8,balanced,0.1444533367951711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,8,power_law_1.01,0.18072960376739503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,8,power_law_1.01,0.21252479553222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,8,power_law_1.2,0.1839679956436157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,1,8,power_law_1.2,0.21585280895233155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,16,1,balanced,0.10114666819572449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,16,1,balanced,0.10116266210873921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,16,1,power_law_1.01,0.0827455997467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,16,1,power_law_1.01,0.08361600041389465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,16,1,power_law_1.2,0.07838720083236694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,16,1,power_law_1.2,0.07875840067863464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,2,1,balanced,0.41065601507822674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,2,1,balanced,0.41070934136708576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,2,1,power_law_1.01,0.3179392099380493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,2,1,power_law_1.01,0.31855359077453616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,2,1,power_law_1.2,0.2813375949859619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,2,1,power_law_1.2,0.2851968050003052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,32,1,balanced,0.0879200001557668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,32,1,balanced,0.08880533774693807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,32,1,power_law_1.01,0.07466880083084107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,32,1,power_law_1.01,0.07518079876899719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,32,1,power_law_1.2,0.06906239986419678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,32,1,power_law_1.2,0.0716480016708374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,4,1,balanced,0.23908267418543497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,4,1,balanced,0.24071999390920004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,4,1,power_law_1.01,0.1872383952140808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,4,1,power_law_1.01,0.1873088002204895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,4,1,power_law_1.2,0.1743872046470642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,4,1,power_law_1.2,0.17564799785614013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,8,1,balanced,0.15033066272735596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,8,1,balanced,0.1509119967619578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,8,1,power_law_1.01,0.11510399580001832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,8,1,power_law_1.01,0.11601279973983765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,8,1,power_law_1.2,0.1102336049079895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2048,8,256,8,1,power_law_1.2,0.11175680160522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,1,balanced,0.9715840021769205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,1,balanced,0.9735573132832845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,1,power_law_1.01,0.5818048000335694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,1,power_law_1.01,0.5848320007324219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,1,power_law_1.2,0.524563217163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,1,power_law_1.2,0.5323135852813721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,16,balanced,0.10109333197275798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,16,balanced,0.10155733426411946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,16,power_law_1.01,0.09575039744377137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,16,power_law_1.01,0.1040768027305603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,16,power_law_1.2,0.09287040233612061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,16,power_law_1.2,0.09473279714584351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,2,balanced,0.5076853434244791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,2,balanced,0.5106559991836548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,2,power_law_1.01,0.3327167987823486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,2,power_law_1.01,0.3650496006011963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,2,power_law_1.2,0.3366528034210205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,2,power_law_1.2,0.3380223989486694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,32,balanced,0.06980800131956737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,32,balanced,0.0701386680205663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,32,power_law_1.01,0.06758400201797485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,32,power_law_1.01,0.0704255998134613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,32,power_law_1.2,0.06610559821128845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,32,power_law_1.2,0.06735360026359558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,4,balanced,0.2779573400815328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,4,balanced,0.291978657245636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,4,power_law_1.01,0.23297278881072997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,4,power_law_1.01,0.2380671977996826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,4,power_law_1.2,0.18307199478149414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,4,power_law_1.2,0.2044287919998169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,8,balanced,0.17045332988103232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,8,balanced,0.17056532700856528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,8,power_law_1.01,0.13905919790267945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,8,power_law_1.01,0.15889279842376708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,8,power_law_1.2,0.11586560010910034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,1,8,power_law_1.2,0.17072000503540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,16,1,balanced,0.12096533179283142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,16,1,balanced,0.12129599849383037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,16,1,power_law_1.01,0.08510720133781433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,16,1,power_law_1.01,0.08514559864997864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,16,1,power_law_1.2,0.07994239926338195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,16,1,power_law_1.2,0.08031359910964966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,2,1,balanced,0.49934399127960205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,2,1,balanced,0.5021760066350301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,2,1,power_law_1.01,0.3067967891693115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,2,1,power_law_1.01,0.3138816118240356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,2,1,power_law_1.2,0.276307201385498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,2,1,power_law_1.2,0.28440959453582765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,32,1,balanced,0.09283199906349182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,32,1,balanced,0.09331199526786804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,32,1,power_law_1.01,0.06991999745368957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,32,1,power_law_1.01,0.07047680020332336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,32,1,power_law_1.2,0.06507520079612732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,32,1,power_law_1.2,0.06700800061225891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,4,1,balanced,0.2789173324902852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,4,1,balanced,0.28032533327738446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,4,1,power_law_1.01,0.17613439559936522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,4,1,power_law_1.01,0.180511999130249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,4,1,power_law_1.2,0.16587519645690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,4,1,power_law_1.2,0.1669312000274658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,8,1,balanced,0.18533867597579956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,8,1,balanced,0.18593599398930868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,8,1,power_law_1.01,0.11544959545135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,8,1,power_law_1.01,0.11923840045928955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,8,1,power_law_1.2,0.10855040550231934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,6144,2560,8,160,8,1,power_law_1.2,0.10974080562591552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,1,balanced,0.9160959720611572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,1,balanced,0.918293317159017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,1,power_law_1.01,0.6913023948669433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,1,power_law_1.01,0.7051648139953614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,1,power_law_1.2,0.628704023361206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,1,power_law_1.2,0.641324806213379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,128,balanced,0.04305600126584371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,128,balanced,0.04372799893220266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,128,power_law_1.01,0.051507198810577394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,128,power_law_1.01,0.05300480127334595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,128,power_law_1.2,0.05258240103721619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,128,power_law_1.2,0.05449600219726562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,16,balanced,0.09771200021107991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,16,balanced,0.09822932879130046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,16,power_law_1.01,0.15186560153961182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,16,power_law_1.01,0.1544000029563904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,16,power_law_1.2,0.1397055983543396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,16,power_law_1.2,0.1522495985031128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,2,balanced,0.48286934693654376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,2,balanced,0.48336533705393475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,2,power_law_1.01,0.3918463945388794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,2,power_law_1.01,0.436352014541626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,2,power_law_1.2,0.40091519355773925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,2,power_law_1.2,0.42405118942260744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,256,balanced,0.04373333354791006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,256,balanced,0.04381333291530609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,256,power_law_1.01,0.042508798837661746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,256,power_law_1.01,0.04258559942245484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,256,power_law_1.2,0.04229120016098022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,256,power_law_1.2,0.043935999274253845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,32,balanced,0.07031466563542683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,32,balanced,0.07107200225194295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,32,power_law_1.01,0.08651520013809204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,32,power_law_1.01,0.09342719912528992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,32,power_law_1.2,0.08102399706840516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,32,power_law_1.2,0.08234239816665649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,4,balanced,0.2770293354988098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,4,balanced,0.29201600948969525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,4,power_law_1.01,0.2789760112762451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,4,power_law_1.01,0.291596794128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,4,power_law_1.2,0.2610111951828003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,4,power_law_1.2,0.2819904088973999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,64,balanced,0.053930665055910744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,64,balanced,0.05420800050099691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,64,power_law_1.01,0.06354560256004334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,64,power_law_1.01,0.06723200082778931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,64,power_law_1.2,0.061612802743911746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,64,power_law_1.2,0.06225919723510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,8,balanced,0.1523146629333496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,8,balanced,0.16086933016777039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,8,power_law_1.01,0.22122879028320314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,8,power_law_1.01,0.23180799484252929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,8,power_law_1.2,0.23017599582672119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,1,8,power_law_1.2,0.24238719940185546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,16,1,balanced,0.11377066373825073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,16,1,balanced,0.11714667081832886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,16,1,power_law_1.01,0.09376639723777772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,16,1,power_law_1.01,0.0957759976387024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,16,1,power_law_1.2,0.08799999952316284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,16,1,power_law_1.2,0.08880640268325805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,2,1,balanced,0.4748266537984212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,2,1,balanced,0.47863467534383136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,2,1,power_law_1.01,0.3578495979309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,2,1,power_law_1.01,0.3655359983444214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,2,1,power_law_1.2,0.3292992115020752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,2,1,power_law_1.2,0.34714879989624026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,32,1,balanced,0.09735467036565144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,32,1,balanced,0.09770133097966512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,32,1,power_law_1.01,0.08273919820785522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,32,1,power_law_1.01,0.08293120265007019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,32,1,power_law_1.2,0.07825279831886292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,32,1,power_law_1.2,0.07864959836006165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,4,1,balanced,0.27474133173624676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,4,1,balanced,0.27502934137980145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,4,1,power_law_1.01,0.2092223882675171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,4,1,power_law_1.01,0.2130687952041626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,4,1,power_law_1.2,0.19727360010147094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,4,1,power_law_1.2,0.20151679515838622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,8,1,balanced,0.1697333256403605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,8,1,balanced,0.1748960018157959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,8,1,power_law_1.01,0.13619199991226197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,8,1,power_law_1.01,0.14369280338287355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,8,1,power_law_1.2,0.12364799976348877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,256,8,1,power_law_1.2,0.1256832003593445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,1,balanced,0.92685333887736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,1,balanced,0.9270293712615967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,1,power_law_1.01,0.8292415618896485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,1,power_law_1.01,0.8407551765441894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,1,power_law_1.2,0.7461056232452392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,1,power_law_1.2,0.7549439907073975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,128,balanced,0.043680002291997276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,128,balanced,0.043935999274253845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,128,power_law_1.01,0.05988479852676391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,128,power_law_1.01,0.060102397203445436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,128,power_law_1.2,0.05681279897689819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,128,power_law_1.2,0.05917440056800842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,16,balanced,0.09815466403961182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,16,balanced,0.09880000352859497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,16,power_law_1.01,0.20573439598083496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,16,power_law_1.01,0.2067199945449829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,16,power_law_1.2,0.20591359138488768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,16,power_law_1.2,0.2076864004135132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,2,balanced,0.4866559902826945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,2,balanced,0.4883466561635335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,2,power_law_1.01,0.5151807785034179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,2,power_law_1.01,0.5303808212280273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,2,power_law_1.2,0.4843711853027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,2,power_law_1.2,0.49793281555175783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,32,balanced,0.07044800122578938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,32,balanced,0.07046933472156525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,32,power_law_1.01,0.136518394947052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,32,power_law_1.01,0.1379968047142029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,32,power_law_1.2,0.13608959913253785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,32,power_law_1.2,0.13974399566650392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,4,balanced,0.2693493366241455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,4,balanced,0.2698240081469218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,4,power_law_1.01,0.3654911994934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,4,power_law_1.01,0.3684159994125366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,4,power_law_1.2,0.33535358905792234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,4,power_law_1.2,0.3562304019927979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,64,balanced,0.0537120004494985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,64,balanced,0.053717335065205894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,64,power_law_1.01,0.07902079820632935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,64,power_law_1.01,0.08117120265960694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,64,power_law_1.2,0.0770367980003357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,64,power_law_1.2,0.07856000065803528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,8,balanced,0.15404799580574036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,8,balanced,0.15708800156911215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,8,power_law_1.01,0.2744064092636108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,8,power_law_1.01,0.2870847940444946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,8,power_law_1.2,0.2703808069229126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,1,8,power_law_1.2,0.3096191883087158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,16,1,balanced,0.11347732941309611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,16,1,balanced,0.11522133151690166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,16,1,power_law_1.01,0.1050495982170105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,16,1,power_law_1.01,0.10539519786834717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,16,1,power_law_1.2,0.09778559803962708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,16,1,power_law_1.2,0.09941759705543518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,2,1,balanced,0.4729173183441162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,2,1,balanced,0.4734666744867961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,2,1,power_law_1.01,0.41303038597106934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,2,1,power_law_1.01,0.4331711769104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,2,1,power_law_1.2,0.38015360832214357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,2,1,power_law_1.2,0.38736639022827146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,32,1,balanced,0.0969493289788564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,32,1,balanced,0.09776533643404643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,32,1,power_law_1.01,0.09139840006828308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,32,1,power_law_1.01,0.09287679791450501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,32,1,power_law_1.2,0.08634880185127258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,32,1,power_law_1.2,0.08686720132827759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,4,1,balanced,0.2723093430201213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,4,1,balanced,0.2735840082168579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,4,1,power_law_1.01,0.2344575881958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,4,1,power_law_1.01,0.2443392038345337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,4,1,power_law_1.2,0.22239999771118163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,4,1,power_law_1.2,0.22645120620727538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,8,1,balanced,0.16949333747227988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,8,1,balanced,0.1718719998995463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,8,1,power_law_1.01,0.1548095941543579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,8,1,power_law_1.01,0.15568000078201294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,8,1,power_law_1.2,0.14752639532089235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16,7168,2048,8,384,8,1,power_law_1.2,0.14997119903564454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,1,balanced,0.14761066436767578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,1,balanced,0.14827199776967367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,1,power_law_1.01,0.14090240001678467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,1,power_law_1.01,0.14287999868392945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,1,power_law_1.2,0.14115840196609497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,1,power_law_1.2,0.1433087944984436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,128,balanced,0.047930667797724404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,128,balanced,0.048512001832326256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,128,power_law_1.01,0.04723199903964996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,128,power_law_1.01,0.04760960042476654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,128,power_law_1.2,0.04749439954757691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,128,power_law_1.2,0.04790399968624115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,16,balanced,0.05008000135421753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,16,balanced,0.05194133520126343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,16,power_law_1.01,0.04896000027656555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,16,power_law_1.01,0.049318400025367734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,16,power_law_1.2,0.04896000027656555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,16,power_law_1.2,0.049158400297164916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,2,balanced,0.09879466891288757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,2,balanced,0.09935999910036723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,2,power_law_1.01,0.09477760195732117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,2,power_law_1.01,0.09580159783363343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,2,power_law_1.2,0.09587839841842652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,2,power_law_1.2,0.09650560021400452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,32,balanced,0.04920533299446106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,32,balanced,0.05012266834576925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,32,power_law_1.01,0.04748159945011139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,32,power_law_1.01,0.04798080027103424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,32,power_law_1.2,0.04801279902458191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,32,power_law_1.2,0.048102399706840514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,4,balanced,0.07415999968846639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,4,balanced,0.07572266459465027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,4,power_law_1.01,0.07146880030632019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,4,power_law_1.01,0.07225599884986877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,4,power_law_1.2,0.07222399711608887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,4,power_law_1.2,0.0738048017024994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,64,balanced,0.04779199759165446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,64,balanced,0.04791999856630961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,64,power_law_1.01,0.047065600752830505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,64,power_law_1.01,0.04711039960384369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,64,power_law_1.2,0.04743039906024933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,64,power_law_1.2,0.04744960069656372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,8,balanced,0.05348266661167145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,8,balanced,0.0540533314148585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,8,power_law_1.01,0.05249279737472534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,8,power_law_1.01,0.05406079888343811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,8,power_law_1.2,0.05406079888343811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,1,8,power_law_1.2,0.05429760217666626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,2,1,balanced,0.09698667128880818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,2,1,balanced,0.09896533687909444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,2,1,power_law_1.01,0.09390079975128174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,2,1,power_law_1.01,0.09404799938201905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,2,1,power_law_1.2,0.095769602060318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,2,1,power_law_1.2,0.09605759978294373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,4,1,balanced,0.07668266693751018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,4,1,balanced,0.07686399916807811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,4,1,power_law_1.01,0.07201279997825623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,4,1,power_law_1.01,0.07354239821434021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,4,1,power_law_1.2,0.07246720194816589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2048,768,8,128,4,1,power_law_1.2,0.07428479790687562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,1,balanced,0.3569440046946208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,1,balanced,0.35731200377146405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,1,power_law_1.01,0.3256767988204956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,1,power_law_1.01,0.32943360805511473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,1,power_law_1.2,0.33566720485687257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,1,power_law_1.2,0.336083197593689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,128,balanced,0.06631466746330261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,128,balanced,0.06639466683069865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,128,power_law_1.01,0.06409599781036376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,128,power_law_1.01,0.0642624020576477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,128,power_law_1.2,0.06401280164718628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,128,power_law_1.2,0.06421120166778564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,16,balanced,0.0769706666469574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,16,balanced,0.07867733140786488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,16,power_law_1.01,0.07371519804000855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,16,power_law_1.01,0.07496320009231568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,16,power_law_1.2,0.07370880246162415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,16,power_law_1.2,0.07530879974365234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,2,balanced,0.21652267376581827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,2,balanced,0.21663467089335123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,2,power_law_1.01,0.19874559640884398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,2,power_law_1.01,0.20524799823760986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,2,power_law_1.2,0.19952640533447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,2,power_law_1.2,0.20158720016479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,32,balanced,0.06633066634337108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,32,balanced,0.06819200019041698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,32,power_law_1.01,0.06586880087852479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,32,power_law_1.01,0.06709120273590088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,32,power_law_1.2,0.06670719981193543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,32,power_law_1.2,0.06725760102272034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,4,balanced,0.1420906682809194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,4,balanced,0.14247999588648477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,4,power_law_1.01,0.13006080389022828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,4,power_law_1.01,0.1327296018600464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,4,power_law_1.2,0.13427200317382812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,4,power_law_1.2,0.13494399785995484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,64,balanced,0.06526400148868561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,64,balanced,0.06609066824118297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,64,power_law_1.01,0.06369280219078063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,64,power_law_1.01,0.06403840184211732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,64,power_law_1.2,0.06401280164718628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,64,power_law_1.2,0.06469119787216186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,8,balanced,0.10332799951235454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,8,balanced,0.10449066758155823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,8,power_law_1.01,0.0956928014755249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,8,power_law_1.01,0.0974016010761261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,8,power_law_1.2,0.10087679624557495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,1,8,power_law_1.2,0.10120960474014282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,16,1,balanced,0.32629867394765216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,16,1,balanced,0.32683199644088745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,16,1,power_law_1.01,0.29500160217285154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,16,1,power_law_1.01,0.2983871936798096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,16,1,power_law_1.2,0.3018496036529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,16,1,power_law_1.2,0.30288000106811525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,2,1,balanced,0.20984532435735068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,2,1,balanced,0.2100586692492167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,2,1,power_law_1.01,0.19218560457229614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,2,1,power_law_1.01,0.19408639669418334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,2,1,power_law_1.2,0.1906559944152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,2,1,power_law_1.2,0.19298559427261353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,32,1,balanced,0.2797333399454753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,32,1,balanced,0.28199466069539386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,32,1,power_law_1.01,0.2470911979675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,32,1,power_law_1.01,0.2546880006790161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,32,1,power_law_1.2,0.2606911897659302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,32,1,power_law_1.2,0.2620800018310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,4,1,balanced,0.13668800393740335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,4,1,balanced,0.1366986632347107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,4,1,power_law_1.01,0.12741119861602784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,4,1,power_law_1.01,0.12892160415649415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,4,1,power_law_1.2,0.13043839931488038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,4,1,power_law_1.2,0.13057279586791992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,8,1,balanced,0.4229653278986613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,8,1,balanced,0.42390934626261395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,8,1,power_law_1.01,0.3817408084869385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,8,1,power_law_1.01,0.3834304094314575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,8,1,power_law_1.2,0.3929663896560669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,2688,1856,6,128,8,1,power_law_1.2,0.3961087942123413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,1,balanced,0.6053066651026408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,1,balanced,0.6065920193990072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,1,power_law_1.01,0.5185152053833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,1,power_law_1.01,0.5203839778900147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,1,power_law_1.2,0.5152128219604493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,1,power_law_1.2,0.5226943969726563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,128,balanced,0.09691199660301208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,128,balanced,0.09861333171526591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,128,power_law_1.01,0.09616000056266785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,128,power_law_1.01,0.09621120095252991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,128,power_law_1.2,0.09557759761810303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,128,power_law_1.2,0.09617279767990113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,16,balanced,0.13065600395202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,16,balanced,0.1320746640364329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,16,power_law_1.01,0.11729919910430908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,16,power_law_1.01,0.12214399576187134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,16,power_law_1.2,0.12095359563827515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,16,power_law_1.2,0.1224128007888794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,2,balanced,0.35493866602579754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,2,balanced,0.35631465911865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,2,power_law_1.01,0.304640007019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,2,power_law_1.01,0.31705598831176757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,2,power_law_1.2,0.3053760051727295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,2,power_law_1.2,0.3084671974182129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,256,balanced,0.0969493289788564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,256,balanced,0.09885866443316142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,256,power_law_1.01,0.0959231972694397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,256,power_law_1.01,0.09653120040893555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,256,power_law_1.2,0.09601920247077941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,256,power_law_1.2,0.0961471974849701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,32,balanced,0.10713600118954976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,32,balanced,0.10727999607721965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,32,power_law_1.01,0.1039423942565918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,32,power_law_1.01,0.10485119819641113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,32,power_law_1.2,0.10535039901733398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,32,power_law_1.2,0.1060863971710205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,4,balanced,0.22944533824920654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,4,balanced,0.23004800081253052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,4,power_law_1.01,0.21299200057983397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,4,power_law_1.01,0.21967360973358155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,4,power_law_1.2,0.20763518810272216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,4,power_law_1.2,0.2104192018508911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,64,balanced,0.09916266798973083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,64,balanced,0.09937066833178203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,64,power_law_1.01,0.09836800098419189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,64,power_law_1.01,0.09886080026626587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,64,power_law_1.2,0.09786880016326904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,64,power_law_1.2,0.09811840057373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,8,balanced,0.16326399644215903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,8,balanced,0.1646613379319509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,8,power_law_1.01,0.1499071955680847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,8,power_law_1.01,0.1522879958152771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,8,power_law_1.2,0.1504256010055542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,1,8,power_law_1.2,0.1515071988105774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,16,1,balanced,0.1338879962762197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,16,1,balanced,0.13421866297721863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,16,1,power_law_1.01,0.11384960412979125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,16,1,power_law_1.01,0.11388159990310669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,16,1,power_law_1.2,0.11514879465103149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,16,1,power_law_1.2,0.11599999666213989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,2,1,balanced,0.34089601039886475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,2,1,balanced,0.3415093421936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,2,1,power_law_1.01,0.29354879856109617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,2,1,power_law_1.01,0.29774720668792726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,2,1,power_law_1.2,0.29747838973999025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,2,1,power_law_1.2,0.29750399589538573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,32,1,balanced,0.11336533228556316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,32,1,balanced,0.11405866344769795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,32,1,power_law_1.01,0.10355199575424194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,32,1,power_law_1.01,0.10404479503631592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,32,1,power_law_1.2,0.10362240076065063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,32,1,power_law_1.2,0.10443520545959473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,4,1,balanced,0.216538667678833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,4,1,balanced,0.21756800015767416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,4,1,power_law_1.01,0.18647680282592774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,4,1,power_law_1.01,0.18829439878463744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,4,1,power_law_1.2,0.18903039693832396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,4,1,power_law_1.2,0.18984960317611693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,8,1,balanced,0.15613866845766702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,8,1,balanced,0.15666666626930237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,8,1,power_law_1.01,0.14127999544143677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,8,1,power_law_1.01,0.14396799802780152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,8,1,power_law_1.2,0.141702401638031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,3072,1536,8,256,8,1,power_law_1.2,0.1442752003669739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,1,balanced,0.2858293255170186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,1,balanced,0.2865920066833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,1,power_law_1.01,0.3028543949127197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,1,power_law_1.01,0.3214272022247314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,1,power_law_1.2,0.3092927932739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,1,power_law_1.2,0.3118079900741577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,2,balanced,0.20390399297078451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,2,balanced,0.20544000466664633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,2,power_law_1.01,0.21668479442596436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,2,power_law_1.01,0.21747839450836182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,2,power_law_1.2,0.22381439208984374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,2,power_law_1.2,0.2261631965637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,4,balanced,0.1586240033308665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,4,balanced,0.15929599603017172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,4,power_law_1.01,0.16299519538879395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,4,power_law_1.01,0.18194559812545777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,4,power_law_1.2,0.17669119834899902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,4,power_law_1.2,0.17831679582595825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,8,balanced,0.1436906655629476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,8,balanced,0.14455466469128928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,8,power_law_1.01,0.1503999948501587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,8,power_law_1.01,0.15290240049362183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,8,power_law_1.2,0.15237760543823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,1,8,power_law_1.2,0.15434880256652833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,16,1,balanced,0.049914668003718056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,16,1,balanced,0.04996799925963084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,16,1,power_law_1.01,0.055232000350952146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,16,1,power_law_1.01,0.05568000078201294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,16,1,power_law_1.2,0.0548799991607666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,16,1,power_law_1.2,0.055219197273254396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,2,1,balanced,0.17086933056513467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,2,1,balanced,0.1725920041402181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,2,1,power_law_1.01,0.17108479738235474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,2,1,power_law_1.01,0.1762879967689514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,2,1,power_law_1.2,0.17043839693069457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,2,1,power_law_1.2,0.17127039432525634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,32,1,balanced,0.039887999494870506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,32,1,balanced,0.041519999504089355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,32,1,power_law_1.01,0.040089601278305055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,32,1,power_law_1.01,0.04032639861106872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,32,1,power_law_1.2,0.04073599874973297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,32,1,power_law_1.2,0.04100480079650879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,4,1,balanced,0.10812266667683919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,4,1,balanced,0.1086186667283376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,4,1,power_law_1.01,0.10614399909973145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,4,1,power_law_1.01,0.10635520219802856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,4,1,power_law_1.2,0.10490239858627319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,4,1,power_law_1.2,0.10699520111083985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,8,1,balanced,0.06919466455777486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,8,1,balanced,0.07237866520881653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,8,1,power_law_1.01,0.06892160177230836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,8,1,power_law_1.2,0.06936320066452026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,14336,2,8,8,1,power_law_1.2,0.06936960220336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,1,balanced,0.4209493398666382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,1,balanced,0.4232586622238159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,1,power_law_1.01,0.39799039363861083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,1,power_law_1.01,0.40799360275268554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,1,power_law_1.2,0.4116799831390381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,1,power_law_1.2,0.41524481773376465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,128,balanced,0.07260266443093617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,128,balanced,0.07323200007279713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,128,power_law_1.01,0.07223039865493774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,128,power_law_1.01,0.07246720194816589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,128,power_law_1.2,0.0726527988910675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,128,power_law_1.2,0.0737280011177063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,16,balanced,0.08942932883898418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,16,balanced,0.09087466200192769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,16,power_law_1.01,0.08762879967689514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,16,power_law_1.01,0.0883072018623352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,16,power_law_1.2,0.08809599876403809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,16,power_law_1.2,0.08810240030288696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,2,balanced,0.25271467367808026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,2,balanced,0.25272534290949505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,2,power_law_1.01,0.2424448013305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,2,power_law_1.01,0.24463999271392822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,2,power_law_1.2,0.2405184030532837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,2,power_law_1.2,0.24691200256347656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,32,balanced,0.07838933169841766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,32,balanced,0.08055999875068665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,32,power_law_1.01,0.0760320007801056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,32,power_law_1.01,0.07689599990844727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,32,power_law_1.2,0.07756159901618957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,32,power_law_1.2,0.07864959836006165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,4,balanced,0.16007467110951742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,4,balanced,0.16062933206558228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,4,power_law_1.01,0.14859520196914672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,4,power_law_1.01,0.1568511962890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,4,power_law_1.2,0.15164159536361693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,4,power_law_1.2,0.15383039712905883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,64,balanced,0.07442133128643036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,64,balanced,0.07453333338101704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,64,power_law_1.01,0.0729088008403778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,64,power_law_1.01,0.07355520129203796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,64,power_law_1.2,0.07319039702415467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,64,power_law_1.2,0.07319679856300354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,8,balanced,0.11820266644159953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,8,balanced,0.11894399921099345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,8,power_law_1.01,0.1126207947731018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,8,power_law_1.01,0.11320960521697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,8,power_law_1.2,0.11291520595550537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,1,8,power_law_1.2,0.11667840480804444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,16,1,balanced,0.09983999530474345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,16,1,balanced,0.10117333134015401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,16,1,power_law_1.01,0.09671679735183716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,16,1,power_law_1.01,0.09743360280990601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,16,1,power_law_1.2,0.09696639776229858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,16,1,power_law_1.2,0.09733759760856628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,2,1,balanced,0.24497600396474203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,2,1,balanced,0.24527466297149658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,2,1,power_law_1.01,0.2383039951324463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,2,1,power_law_1.01,0.24062080383300782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,2,1,power_law_1.2,0.23582720756530762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,2,1,power_law_1.2,0.24252159595489503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,32,1,balanced,0.08727999528249104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,32,1,balanced,0.08860799670219421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,32,1,power_law_1.01,0.08599039912223816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,32,1,power_law_1.01,0.08637440204620361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,32,1,power_law_1.2,0.08548480272293091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,32,1,power_law_1.2,0.08672000169754028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,4,1,balanced,0.15730667114257812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,4,1,balanced,0.15745066603024802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,4,1,power_law_1.01,0.14996479749679564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,4,1,power_law_1.01,0.15143040418624878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,4,1,power_law_1.2,0.15178240537643434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,4,1,power_law_1.2,0.15479040145874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,8,1,balanced,0.11648533741633098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,8,1,balanced,0.11741866668065389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,8,1,power_law_1.01,0.11240960359573364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,8,1,power_law_1.01,0.11256320476531982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,8,1,power_law_1.2,0.11326080560684204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,1536,8,128,8,1,power_law_1.2,0.11501439809799194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,1,balanced,2.643162727355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,1,balanced,2.6536426544189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,1,power_law_1.01,2.3742464065551756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,1,power_law_1.01,2.402579116821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,1,power_law_1.2,2.4038719177246093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,1,power_law_1.2,2.437548828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,128,balanced,0.27748799324035645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,128,balanced,0.27934932708740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,128,power_law_1.01,0.2761152029037476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,128,power_law_1.01,0.27705600261688235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,128,power_law_1.2,0.27639040946960447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,128,power_law_1.2,0.27809278964996337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,16,balanced,0.43649065494537354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,16,balanced,0.43797866503397626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,16,power_law_1.01,0.41826558113098145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,16,power_law_1.01,0.42698240280151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,16,power_law_1.2,0.41717119216918946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,16,power_law_1.2,0.42250881195068357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,2,balanced,1.4692106246948242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,2,balanced,1.4778025945027669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,2,power_law_1.01,1.3175488471984864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,2,power_law_1.01,1.3206208229064942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,2,power_law_1.2,1.364896011352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,2,power_law_1.2,1.3661184310913086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,256,balanced,0.2747093240420024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,256,balanced,0.2750506599744161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,256,power_law_1.01,0.27239038944244387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,256,power_law_1.01,0.2725888013839722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,256,power_law_1.2,0.2719615936279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,256,power_law_1.2,0.272377610206604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,32,balanced,0.35026665528615314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,32,balanced,0.35178132851918537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,32,power_law_1.01,0.3466815948486328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,32,power_law_1.01,0.3473088026046753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,32,power_law_1.2,0.344051194190979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,32,power_law_1.2,0.348089599609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,4,balanced,0.8835946718851725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,4,balanced,0.8878026803334554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,4,power_law_1.01,0.8259136199951171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,4,power_law_1.01,0.8499967575073242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,4,power_law_1.2,0.8238207817077636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,4,power_law_1.2,0.8315263748168945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,64,balanced,0.2996533314387004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,64,balanced,0.30005866289138794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,64,power_law_1.01,0.2947776079177856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,64,power_law_1.01,0.29694719314575196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,64,power_law_1.2,0.2948607921600342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,64,power_law_1.2,0.29510400295257566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,8,balanced,0.5868159929911295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,8,balanced,0.5878560145696005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,8,power_law_1.01,0.5491072177886963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,8,power_law_1.01,0.5528575897216796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,8,power_law_1.2,0.5486591815948486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,1,8,power_law_1.2,0.5598144054412841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,16,1,balanced,2.279930591583252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,16,1,balanced,2.2806666692097983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,16,1,power_law_1.01,2.0231296539306642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,16,1,power_law_1.01,2.041420745849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,16,1,power_law_1.2,2.0652671813964845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,16,1,power_law_1.2,2.072800064086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,2,1,balanced,1.3867146174112956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,2,1,balanced,1.4314932823181152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,2,1,power_law_1.01,1.2395071983337402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,2,1,power_law_1.01,1.2498687744140624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,2,1,power_law_1.2,1.2533439636230468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,2,1,power_law_1.2,1.2693696022033691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,32,1,balanced,1.7678720156351726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,32,1,balanced,1.7684213320414226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,32,1,power_law_1.01,1.5818623542785644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,32,1,power_law_1.01,1.6028928756713867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,32,1,power_law_1.2,1.612396812438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,32,1,power_law_1.2,1.6257728576660155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,4,1,balanced,0.7893919944763184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,4,1,balanced,0.7904906272888184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,4,1,power_law_1.01,0.7142848014831543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,4,1,power_law_1.01,0.7157055854797363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,4,1,power_law_1.2,0.7219520092010498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,4,1,power_law_1.2,0.7274112224578857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,8,1,balanced,0.4901813268661499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,8,1,balanced,0.4925653139750163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,8,1,power_law_1.01,0.4438079833984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,8,1,power_law_1.01,0.4529407978057861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,8,1,power_law_1.2,0.4570943832397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,4096,2688,22,512,8,1,power_law_1.2,0.4598080158233643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,1,balanced,0.43376000722249347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,1,balanced,0.4368213415145874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,1,power_law_1.01,0.5435776233673095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,1,power_law_1.01,0.5540095806121826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,1,power_law_1.2,0.5092031955718994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,1,power_law_1.2,0.5352320194244384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,2,balanced,0.27793065706888836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,2,balanced,0.2821279962857564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,2,power_law_1.01,0.30275840759277345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,2,power_law_1.01,0.31668479442596437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,2,power_law_1.2,0.3018239974975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,2,power_law_1.2,0.31157119274139405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,4,balanced,0.20368534326553345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,4,balanced,0.2039146622021993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,4,power_law_1.01,0.21375999450683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,4,power_law_1.01,0.23395841121673583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,4,power_law_1.2,0.2212224006652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,4,power_law_1.2,0.23916800022125245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,8,balanced,0.17519466082255045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,8,balanced,0.1757813294728597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,8,power_law_1.01,0.18540799617767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,8,power_law_1.01,0.19352320432662964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,8,power_law_1.2,0.18988159894943238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,1,8,power_law_1.2,0.19174400568008423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,16,1,balanced,0.07441066702206929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,16,1,balanced,0.07646400233109792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,16,1,power_law_1.01,0.07545599937438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,16,1,power_law_1.01,0.07809919714927674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,16,1,power_law_1.2,0.07675520181655884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,16,1,power_law_1.2,0.07779200077056884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,2,1,balanced,0.2482186754544576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,2,1,balanced,0.24990399678548178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,2,1,power_law_1.01,0.2753216028213501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,2,1,power_law_1.01,0.2877311944961548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,2,1,power_law_1.2,0.2789952039718628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,2,1,power_law_1.2,0.2794303894042969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,32,1,balanced,0.055973331133524575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,32,1,balanced,0.056943997740745544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,32,1,power_law_1.01,0.061740797758102414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,32,1,power_law_1.01,0.06185600161552429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,32,1,power_law_1.2,0.06178560256958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,32,1,power_law_1.2,0.061875200271606444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,4,1,balanced,0.15129066507021585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,4,1,balanced,0.1532373329003652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,4,1,power_law_1.01,0.15626239776611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,4,1,power_law_1.01,0.16248320341110228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,4,1,power_law_1.2,0.16098560094833375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,4,1,power_law_1.2,0.16174720525741576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,8,1,balanced,0.09288533528645833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,8,1,balanced,0.09882666667302449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,8,1,power_law_1.01,0.09749119877815246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,8,1,power_law_1.01,0.09889280200004577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,8,1,power_law_1.2,0.09791359901428223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,16384,2,8,8,1,power_law_1.2,0.09858559966087341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,1,balanced,1.5462026596069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,1,balanced,1.5498827298482258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,1,power_law_1.01,1.2790207862854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,1,power_law_1.01,1.304966354370117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,1,power_law_1.2,1.3079808235168457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,1,power_law_1.2,1.3339327812194823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,128,balanced,0.1523146629333496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,128,balanced,0.15239466230074564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,128,power_law_1.01,0.14963200092315673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,128,power_law_1.01,0.1513216018676758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,128,power_law_1.2,0.1508031964302063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,128,power_law_1.2,0.15121279954910277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,16,balanced,0.2400373419125875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,16,balanced,0.24045334259668985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,16,power_law_1.01,0.2290816068649292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,16,power_law_1.01,0.23374719619750978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,16,power_law_1.2,0.22334721088409423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,16,power_law_1.2,0.2344896078109741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,2,balanced,0.8551999727884928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,2,balanced,0.8580533663431803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,2,power_law_1.01,0.7283520221710205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,2,power_law_1.01,0.7369344234466553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,2,power_law_1.2,0.7314112186431885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,2,power_law_1.2,0.7331456184387207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,256,balanced,0.14944533507029215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,256,balanced,0.15001599987347922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,256,power_law_1.01,0.1482432007789612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,256,power_law_1.01,0.14841599464416505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,256,power_law_1.2,0.14788479804992677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,256,power_law_1.2,0.1482367992401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,32,balanced,0.18097599347432455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,32,power_law_1.01,0.17077759504318238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,32,power_law_1.01,0.17568000555038452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,32,power_law_1.2,0.17509119510650634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,32,power_law_1.2,0.1797760009765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,4,balanced,0.4987786610921224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,4,balanced,0.498960018157959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,4,power_law_1.01,0.463424015045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,4,power_law_1.01,0.4634560108184814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,4,power_law_1.2,0.4456639766693115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,4,power_law_1.2,0.46715521812438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,64,balanced,0.15853333473205566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,64,balanced,0.15878933668136597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,64,power_law_1.01,0.15652480125427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,64,power_law_1.01,0.15675519704818724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,64,power_law_1.2,0.15598080158233643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,64,power_law_1.2,0.15699199438095093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,8,balanced,0.3274453282356262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,8,balanced,0.32876267035802204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,8,power_law_1.01,0.2967679977416992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,8,power_law_1.01,0.31503360271453856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,8,power_law_1.2,0.30059518814086916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,1,8,power_law_1.2,0.31538560390472414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,16,1,balanced,0.24343466758728027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,16,1,balanced,0.24392000834147134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,16,1,power_law_1.01,0.20611839294433593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,16,1,power_law_1.01,0.21103999614715577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,16,1,power_law_1.2,0.2043776035308838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,16,1,power_law_1.2,0.20967040061950684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,2,1,balanced,0.8078933556874593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,2,1,balanced,0.8126880327860514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,2,1,power_law_1.01,0.688095998764038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,2,1,power_law_1.01,0.694547176361084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,2,1,power_law_1.2,0.689683198928833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,2,1,power_law_1.2,0.6967616081237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,32,1,balanced,0.20122132698694864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,32,1,balanced,0.203658660252889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,32,1,power_law_1.01,0.18586879968643188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,32,1,power_law_1.01,0.1863360047340393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,32,1,power_law_1.2,0.18584959506988524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,32,1,power_law_1.2,0.18608640432357787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,4,1,balanced,0.4680639902750651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,4,1,balanced,0.46854933102925617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,4,1,power_law_1.01,0.4018496036529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,4,1,power_law_1.01,0.4065983772277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,4,1,power_law_1.2,0.4039616107940674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,4,1,power_law_1.2,0.4090752124786377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,8,1,balanced,0.3124426603317261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,8,1,balanced,0.3137120008468628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,8,1,power_law_1.01,0.2676032066345215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,8,1,power_law_1.01,0.271833610534668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,8,1,power_law_1.2,0.26784000396728513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2048,8,256,8,1,power_law_1.2,0.27238399982452394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,1,balanced,1.2220533688863118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,1,balanced,1.2303199768066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,1,power_law_1.01,1.1121983528137207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,1,power_law_1.01,1.1387519836425781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,1,power_law_1.2,1.1387200355529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,1,power_law_1.2,1.1546815872192382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,16,balanced,0.19243200620015463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,16,balanced,0.19336533546447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,16,power_law_1.01,0.1828160047531128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,16,power_law_1.01,0.18376319408416747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,16,power_law_1.2,0.18448640108108522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,16,power_law_1.2,0.18747520446777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,2,balanced,0.6673866907755533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,2,balanced,0.6685439745585123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,2,power_law_1.01,0.6174208164215088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,2,power_law_1.01,0.6349503993988037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,2,power_law_1.2,0.6272255897521972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,2,power_law_1.2,0.6417215824127197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,32,balanced,0.13889599839846292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,32,balanced,0.13934399684270224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,32,power_law_1.01,0.13556480407714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,32,power_law_1.01,0.1366976022720337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,32,power_law_1.2,0.1356608033180237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,32,power_law_1.2,0.13654400110244752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,4,balanced,0.3958666721979777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,4,balanced,0.39769065380096436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,4,power_law_1.01,0.3649280071258545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,4,power_law_1.01,0.37895679473876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,4,power_law_1.2,0.3811903953552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,4,power_law_1.2,0.38273279666900634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,8,balanced,0.25781865914662677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,8,balanced,0.2605653405189514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,8,power_law_1.01,0.24657280445098878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,8,power_law_1.01,0.2497472047805786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,8,power_law_1.2,0.2403775930404663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,1,8,power_law_1.2,0.2518336057662964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,16,1,balanced,0.1985386610031128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,16,1,balanced,0.19941866397857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,16,1,power_law_1.01,0.1786239981651306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,16,1,power_law_1.01,0.17946239709854125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,16,1,power_law_1.2,0.17989120483398438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,16,1,power_law_1.2,0.1883520007133484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,2,1,balanced,0.6502559979756674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,2,1,balanced,0.6533706585566202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,2,1,power_law_1.01,0.592959976196289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,2,1,power_law_1.01,0.5957952022552491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,2,1,power_law_1.2,0.6109888076782226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,2,1,power_law_1.2,0.6162687778472901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,32,1,balanced,0.15590399503707886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,32,1,balanced,0.15654399991035461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,32,1,power_law_1.01,0.14860160350799562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,32,1,power_law_1.01,0.1490048050880432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,32,1,power_law_1.2,0.150764799118042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,32,1,power_law_1.2,0.15111680030822755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,4,1,balanced,0.37116265296936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,4,1,balanced,0.3723893165588379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,4,1,power_law_1.01,0.34973440170288084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,4,1,power_law_1.01,0.3513983964920044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,4,1,power_law_1.2,0.3567039966583252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,4,1,power_law_1.2,0.3575551986694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,8,1,balanced,0.23718400796254477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,8,1,balanced,0.24012800057729086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,8,1,power_law_1.01,0.22480640411376954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,8,1,power_law_1.01,0.22618238925933837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,8,1,power_law_1.2,0.22731521129608154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,6144,2560,8,160,8,1,power_law_1.2,0.2283328056335449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,1,balanced,1.7934400240580242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,1,balanced,1.7989813486735027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,1,power_law_1.01,1.5159423828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,1,power_law_1.01,1.5226431846618653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,1,power_law_1.2,1.5421952247619628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,1,power_law_1.2,1.5768256187438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,128,balanced,0.1676959991455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,128,balanced,0.1678826610247294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,128,power_law_1.01,0.16497279405593873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,128,power_law_1.01,0.1650879979133606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,128,power_law_1.2,0.16490880250930787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,128,power_law_1.2,0.16517119407653807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,16,balanced,0.27236799399058026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,16,balanced,0.2724799911181132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,16,power_law_1.01,0.255295991897583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,16,power_law_1.01,0.25620479583740235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,16,power_law_1.2,0.24967041015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,16,power_law_1.2,0.26319360733032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,2,balanced,0.979477326075236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,2,balanced,0.9920106728871664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,2,power_law_1.01,0.862822437286377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,2,power_law_1.01,0.8730815887451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,2,power_law_1.2,0.8316543579101563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,2,power_law_1.2,0.8693056106567383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,256,balanced,0.1646453340848287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,256,balanced,0.1646880010763804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,256,power_law_1.01,0.1610751986503601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,256,power_law_1.01,0.16139520406723024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,256,power_law_1.2,0.16106879711151123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,256,power_law_1.2,0.16352640390396117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,32,balanced,0.20291733741760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,32,balanced,0.20359466473261514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,32,power_law_1.01,0.19608960151672364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,32,power_law_1.01,0.19726719856262206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,32,power_law_1.2,0.19273600578308106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,32,power_law_1.2,0.1993600010871887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,4,balanced,0.5710293451944987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,4,balanced,0.5717973311742147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,4,power_law_1.01,0.5130239963531494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,4,power_law_1.01,0.5272895812988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,4,power_law_1.2,0.5098495960235596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,4,power_law_1.2,0.522163200378418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,64,balanced,0.17272533973058066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,64,balanced,0.17467733224232992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,64,power_law_1.01,0.17025920152664184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,64,power_law_1.01,0.17160320281982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,64,power_law_1.2,0.17107839584350587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,64,power_law_1.2,0.17166080474853515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,8,balanced,0.37139201164245605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,8,balanced,0.37546666463216144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,8,power_law_1.01,0.34323840141296386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,8,power_law_1.01,0.3609215974807739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,8,power_law_1.2,0.3313535928726196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,1,8,power_law_1.2,0.335699200630188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,16,1,balanced,0.2789280017217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,16,1,balanced,0.2790079911549886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,16,1,power_law_1.01,0.2323199987411499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,16,1,power_law_1.01,0.24113919734954833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,16,1,power_law_1.2,0.23395841121673583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,16,1,power_law_1.2,0.2346496105194092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,2,1,balanced,0.9414133230845133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,2,1,balanced,0.9420906702677408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,2,1,power_law_1.01,0.8037759780883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,2,1,power_law_1.01,0.8057663917541504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,2,1,power_law_1.2,0.8074239730834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,2,1,power_law_1.2,0.8133888244628906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,32,1,balanced,0.22802666823069254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,32,1,balanced,0.230512003103892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,32,1,power_law_1.01,0.21159679889678956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,32,1,power_law_1.01,0.21353600025177003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,32,1,power_law_1.2,0.2133375883102417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,32,1,power_law_1.2,0.21347200870513916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,4,1,balanced,0.5399146477381388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,4,1,balanced,0.5410773356755575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,4,1,power_law_1.01,0.46650238037109376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,4,1,power_law_1.01,0.4738304138183594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,4,1,power_law_1.2,0.4586304187774658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,4,1,power_law_1.2,0.46936960220336915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,8,1,balanced,0.36259734630584717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,8,1,balanced,0.36319998900095624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,8,1,power_law_1.01,0.30680959224700927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,8,1,power_law_1.01,0.30846080780029295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,8,1,power_law_1.2,0.3063231945037842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,256,8,1,power_law_1.2,0.3115648031234741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,1,balanced,2.736175855000814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,1,balanced,2.777791976928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,1,power_law_1.01,2.080940818786621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,1,power_law_1.01,2.0948352813720703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,1,power_law_1.2,2.01461124420166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,1,power_law_1.2,2.031737518310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,128,balanced,0.22588799397150675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,128,balanced,0.22605866193771362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,128,power_law_1.01,0.22422399520874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,128,power_law_1.01,0.2245311975479126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,128,power_law_1.2,0.22434558868408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,128,power_law_1.2,0.22469758987426758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,16,balanced,0.3698666493097941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,16,balanced,0.3710666497548421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,16,power_law_1.01,0.34179840087890623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,16,power_law_1.01,0.3420864105224609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,16,power_law_1.2,0.3347520112991333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,16,power_law_1.2,0.3371135950088501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,2,balanced,1.465269406636556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,2,balanced,1.4678719838460286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,2,power_law_1.01,1.1403648376464843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,2,power_law_1.01,1.2027456283569335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,2,power_law_1.2,1.091443157196045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,2,power_law_1.2,1.1612799644470215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,32,balanced,0.2895519932111104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,32,balanced,0.2903733253479004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,32,power_law_1.01,0.273907208442688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,32,power_law_1.01,0.27666559219360354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,32,power_law_1.2,0.26845440864562986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,32,power_law_1.2,0.271616005897522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,4,balanced,0.8270346323649088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,4,balanced,0.8304053147633871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,4,power_law_1.01,0.6962111949920654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,4,power_law_1.01,0.7390783786773681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,4,power_law_1.2,0.6610047817230225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,4,power_law_1.2,0.7169280052185059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,64,balanced,0.24037333329518637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,64,balanced,0.24213866392771402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,64,power_law_1.01,0.23418879508972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,64,power_law_1.01,0.23991041183471679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,64,power_law_1.2,0.23280000686645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,64,power_law_1.2,0.2390592098236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,8,balanced,0.5263413190841675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,8,balanced,0.5269333521525065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,8,power_law_1.01,0.4654911994934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,8,power_law_1.01,0.4779263973236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,8,power_law_1.2,0.454585599899292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,1,8,power_law_1.2,0.46485118865966796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,16,1,balanced,0.369818647702535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,16,1,balanced,0.37034134070078534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,16,1,power_law_1.01,0.3273024082183838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,16,1,power_law_1.01,0.32875521183013917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,16,1,power_law_1.2,0.328108811378479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,16,1,power_law_1.2,0.32901759147644044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,2,1,balanced,1.3655999501546223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,2,1,balanced,1.3971999486287434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,2,1,power_law_1.01,1.0796159744262694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,2,1,power_law_1.01,1.0836607933044433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,2,1,power_law_1.2,1.0658559799194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,2,1,power_law_1.2,1.0823552131652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,32,1,balanced,0.3156426747639974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,32,1,balanced,0.31697599093119305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,32,1,power_law_1.01,0.2768831968307495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,32,1,power_law_1.01,0.27924480438232424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,32,1,power_law_1.2,0.2745599985122681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,32,1,power_law_1.2,0.27647359371185304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,4,1,balanced,0.773792028427124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,4,1,balanced,0.7764586607615153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,4,1,power_law_1.01,0.629036808013916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,4,1,power_law_1.01,0.6317759990692139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,4,1,power_law_1.2,0.6346816062927246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,4,1,power_law_1.2,0.6350848197937011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,8,1,balanced,0.5068639914194742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,8,1,balanced,0.5077919960021973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,8,1,power_law_1.01,0.4209023952484131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,8,1,power_law_1.01,0.42295041084289553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,8,1,power_law_1.2,0.4139391899108887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,160,7168,2048,8,384,8,1,power_law_1.2,0.4168831825256348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,1,balanced,1.5144160588582356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,1,balanced,1.5212799708048503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,1,power_law_1.01,1.5710463523864746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,1,power_law_1.01,1.5976703643798829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,1,power_law_1.2,1.5945023536682128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,1,power_law_1.2,1.6020288467407227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,128,balanced,0.8855360349019369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,128,balanced,0.8869120279947916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,128,power_law_1.01,0.9377984046936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,128,power_law_1.01,0.9473535537719726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,128,power_law_1.2,0.9744192123413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,128,power_law_1.2,0.9745599746704101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,16,balanced,0.9297546545664469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,16,balanced,0.9306826591491699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,16,power_law_1.01,0.9956864356994629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,16,power_law_1.01,1.0278528213500977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,16,power_law_1.2,0.9933823585510254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,16,power_law_1.2,1.0470272064208985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,2,balanced,1.2750453154246013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,2,balanced,1.2792373498280842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,2,power_law_1.01,1.3310208320617676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,2,power_law_1.01,1.3375616073608398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,2,power_law_1.2,1.336627197265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,2,power_law_1.2,1.3608832359313965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,32,balanced,0.9047893683115641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,32,balanced,0.9071253140767416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,32,power_law_1.01,0.9546367645263671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,32,power_law_1.01,0.9712703704833985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,32,power_law_1.2,0.9993344306945801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,32,power_law_1.2,1.0003520011901856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,4,balanced,1.0711627006530762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,4,balanced,1.0862507025400798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,4,power_law_1.01,1.1665663719177246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,4,power_law_1.01,1.1705151557922364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,4,power_law_1.2,1.1471296310424806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,4,power_law_1.2,1.2163904190063477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,64,balanced,0.8929706414540609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,64,balanced,0.8939092953999838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,64,power_law_1.01,0.9446016311645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,64,power_law_1.01,0.9464192390441895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,64,power_law_1.2,0.9765055656433106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,64,power_law_1.2,1.019987201690674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,8,balanced,0.9763253529866537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,8,balanced,0.9792426427205404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,8,power_law_1.01,1.0510848045349122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,8,power_law_1.01,1.0601856231689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,8,power_law_1.2,1.0743616104125977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,1,8,power_law_1.2,1.113036823272705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,2,1,balanced,1.0819626649220784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,2,1,balanced,1.084229310353597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,2,1,power_law_1.01,1.1288384437561034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,2,1,power_law_1.01,1.1359807968139648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,2,1,power_law_1.2,1.1422464370727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,2,1,power_law_1.2,1.1464127540588378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,4,1,balanced,0.9072960217793783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,4,1,balanced,0.9169493516286215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,4,1,power_law_1.01,0.9599807739257813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,4,1,power_law_1.01,0.961631965637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,4,1,power_law_1.2,0.9651200294494628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2048,768,8,128,4,1,power_law_1.2,0.9703871726989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,1,balanced,2.589786688486735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,1,balanced,2.7323039372762046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,1,power_law_1.01,2.7964288711547853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,1,power_law_1.01,2.818547248840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,1,power_law_1.2,2.7599359512329102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,1,power_law_1.2,2.800179290771484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,128,balanced,1.1381066640218098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,128,balanced,1.1404053370157878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,128,power_law_1.01,1.2325440406799317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,128,power_law_1.01,1.23373441696167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,128,power_law_1.2,1.345024013519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,128,power_law_1.2,1.3589056015014649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,16,balanced,1.2313706874847412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,16,balanced,1.2368213335673015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,16,power_law_1.01,1.3511039733886718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,16,power_law_1.01,1.396134376525879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,16,power_law_1.2,1.4179776191711426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,16,power_law_1.2,1.4328703880310059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,2,balanced,1.9281973838806152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,2,balanced,1.9340373675028484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,2,power_law_1.01,2.0701183319091796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,2,power_law_1.01,2.111622428894043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,2,power_law_1.2,2.1205631256103517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,2,power_law_1.2,2.1254144668579102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,32,balanced,1.1774933338165283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,32,balanced,1.1789066791534424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,32,power_law_1.01,1.2820287704467774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,32,power_law_1.01,1.2826815605163575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,32,power_law_1.2,1.3637696266174317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,32,power_law_1.2,1.4212736129760741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,4,balanced,1.5302027066548665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,4,balanced,1.540778636932373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,4,power_law_1.01,1.6916799545288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,4,power_law_1.01,1.7191871643066405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,4,power_law_1.2,1.7376895904541017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,4,power_law_1.2,1.7924224853515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,64,balanced,1.1531733671824138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,64,balanced,1.1538986365000408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,64,power_law_1.01,1.2543295860290526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,64,power_law_1.01,1.2660096168518067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,64,power_law_1.2,1.3466943740844726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,64,power_law_1.2,1.3899200439453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,8,balanced,1.3271413644154866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,8,balanced,1.333194653193156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,8,power_law_1.01,1.5054143905639648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,8,power_law_1.01,1.5149824142456054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,8,power_law_1.2,1.5257984161376954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,1,8,power_law_1.2,1.5511808395385742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,16,1,balanced,4.582895914713542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,16,1,balanced,4.5848798751831055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,16,1,power_law_1.01,4.859737777709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,16,1,power_law_1.01,4.876166534423828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,16,1,power_law_1.2,4.890675354003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,16,1,power_law_1.2,4.903968048095703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,2,1,balanced,1.6699679692586262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,2,1,balanced,1.6752266883850098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,2,1,power_law_1.01,1.7730047225952148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,2,1,power_law_1.01,1.778700828552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,2,1,power_law_1.2,1.7771392822265626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,2,1,power_law_1.2,1.7886335372924804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,32,1,balanced,4.024335861206055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,32,1,balanced,4.026266733805339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,32,1,power_law_1.01,4.363910293579101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,32,1,power_law_1.01,4.376768112182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,32,1,power_law_1.2,4.385440063476563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,32,1,power_law_1.2,4.394233703613281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,4,1,balanced,1.2192533016204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,4,1,balanced,1.2196106910705566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,4,1,power_law_1.01,1.28603515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,4,1,power_law_1.01,1.2897664070129395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,4,1,power_law_1.2,1.305350399017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,4,1,power_law_1.2,1.3079551696777343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,8,1,balanced,5.904368082682292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,8,1,balanced,6.160111745198567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,8,1,power_law_1.01,6.322751998901367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,8,1,power_law_1.01,6.558815765380859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,8,1,power_law_1.2,6.591398620605469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,2688,1856,6,128,8,1,power_law_1.2,6.610892486572266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,1,balanced,3.378746668497721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,1,balanced,3.4089600245157876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,1,power_law_1.01,3.484729766845703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,1,power_law_1.01,3.52239990234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,1,power_law_1.2,3.578656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,1,power_law_1.2,3.5801151275634764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,128,balanced,1.3321866989135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,128,balanced,1.332682689030965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,128,power_law_1.01,1.3966976165771485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,128,power_law_1.01,1.4044608116149901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,128,power_law_1.2,1.454195213317871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,128,power_law_1.2,1.4737279891967774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,16,balanced,1.4484799702962239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,16,balanced,1.4531839688618977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,16,power_law_1.01,1.5675456047058105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,16,power_law_1.01,1.593177604675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,16,power_law_1.2,1.6357311248779296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,16,power_law_1.2,1.6992576599121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,2,balanced,2.3650612831115723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,2,balanced,2.3707253138224282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,2,power_law_1.01,2.5913663864135743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,2,power_law_1.01,2.6319807052612303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,2,power_law_1.2,2.631494331359863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,2,power_law_1.2,2.658540725708008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,256,balanced,1.3226293722788494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,256,balanced,1.3252320289611816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,256,power_law_1.01,1.3907391548156738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,256,power_law_1.01,1.396230411529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,256,power_law_1.2,1.463980770111084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,256,power_law_1.2,1.4700160026550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,32,balanced,1.3841759363810222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,32,balanced,1.3852052688598633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,32,power_law_1.01,1.490931224822998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,32,power_law_1.01,1.5285375595092774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,32,power_law_1.2,1.5303232192993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,32,power_law_1.2,1.5796159744262694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,4,balanced,1.849690596262614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,4,balanced,1.8535839716593425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,4,power_law_1.01,1.9825216293334962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,4,power_law_1.01,2.018931198120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,4,power_law_1.2,2.0818111419677736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,4,power_law_1.2,2.09866886138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,64,balanced,1.3480854034423828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,64,balanced,1.3497120539347331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,64,power_law_1.01,1.4278079986572265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,64,power_law_1.01,1.4542400360107421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,64,power_law_1.2,1.5193216323852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,64,power_law_1.2,1.536678409576416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,8,balanced,1.581925392150879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,8,balanced,1.5921707153320312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,8,power_law_1.01,1.7056896209716796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,8,power_law_1.01,1.7338111877441407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,8,power_law_1.2,1.7692224502563476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,1,8,power_law_1.2,1.810918426513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,16,1,balanced,1.11898668607076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,16,1,balanced,1.1198826630910237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,16,1,power_law_1.01,1.1920703887939452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,16,1,power_law_1.01,1.1947711944580077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,16,1,power_law_1.2,1.203667163848877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,16,1,power_law_1.2,1.2061951637268067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,2,1,balanced,2.094538688659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,2,1,balanced,2.099301338195801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,2,1,power_law_1.01,2.243577575683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,2,1,power_law_1.01,2.246214485168457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,2,1,power_law_1.2,2.27270393371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,2,1,power_law_1.2,2.276006317138672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,32,1,balanced,1.0581119855244954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,32,1,balanced,1.062282641728719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,32,1,power_law_1.01,1.1223872184753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,32,1,power_law_1.01,1.1226559638977052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,32,1,power_law_1.2,1.1339136123657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,32,1,power_law_1.2,1.1339839935302733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,4,1,balanced,1.4855999946594238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,4,1,balanced,1.490224043528239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,4,1,power_law_1.01,1.587155246734619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,4,1,power_law_1.01,1.5881279945373534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,4,1,power_law_1.2,1.6013696670532227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,4,1,power_law_1.2,1.6052480697631837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,8,1,balanced,1.2558186848958333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,8,1,balanced,1.2575039863586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,8,1,power_law_1.01,1.3275903701782226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,8,1,power_law_1.01,1.3290495872497559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,8,1,power_law_1.2,1.338163185119629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,3072,1536,8,256,8,1,power_law_1.2,1.3450559616088866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,1,balanced,7.877007802327474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,1,balanced,7.997247695922852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,1,power_law_1.01,7.8709564208984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,1,power_law_1.01,8.047122955322266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,1,power_law_1.2,7.950521850585938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,1,power_law_1.2,8.12520980834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,2,balanced,4.68233076731364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,2,balanced,4.687941233317058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,2,power_law_1.01,5.943180847167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,2,power_law_1.01,5.952684783935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,2,power_law_1.2,5.608153533935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,2,power_law_1.2,5.7485504150390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,4,balanced,3.2664267222086587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,4,balanced,3.2748053868611655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,4,power_law_1.01,4.538771057128907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,4,power_law_1.01,5.126233673095703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,4,power_law_1.2,4.6119232177734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,4,power_law_1.2,4.793529510498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,8,balanced,2.6221973101298013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,8,balanced,2.6317013104756675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,8,power_law_1.01,4.738393783569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,8,power_law_1.01,4.860083389282226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,8,power_law_1.2,4.89557113647461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,1,8,power_law_1.2,4.949676895141602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,16,1,balanced,0.7363733450571696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,16,1,balanced,0.7364319960276285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,16,1,power_law_1.01,0.743116807937622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,16,1,power_law_1.01,0.7477503776550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,16,1,power_law_1.2,0.7407360076904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,16,1,power_law_1.2,0.7449855804443359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,2,1,balanced,3.7539199193318686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,2,1,balanced,3.937727928161621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,2,1,power_law_1.01,3.589888000488281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,2,1,power_law_1.01,3.727123260498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,2,1,power_law_1.2,3.6254657745361327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,2,1,power_law_1.2,3.6721920013427733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,32,1,balanced,0.5590773423512777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,32,1,balanced,0.5689280033111572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,32,1,power_law_1.01,0.5699840068817139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,32,1,power_law_1.01,0.5731967926025391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,32,1,power_law_1.2,0.5772992134094238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,32,1,power_law_1.2,0.5797183990478516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,4,1,balanced,1.9268852869669597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,4,1,balanced,1.9742347399393718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,4,1,power_law_1.01,1.915167999267578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,4,1,power_law_1.01,1.931737518310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,4,1,power_law_1.2,1.9024576187133788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,4,1,power_law_1.2,1.944473648071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,8,1,balanced,1.102826674779256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,8,1,balanced,1.106533368428548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,8,1,power_law_1.01,1.107430362701416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,8,1,power_law_1.01,1.1338879585266113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,8,1,power_law_1.2,1.1343487739562987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,14336,2,8,8,1,power_law_1.2,1.1367039680480957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,1,balanced,4.0007626215616865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,1,balanced,4.051962534586589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,1,power_law_1.01,4.102252960205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,1,power_law_1.01,4.1684223175048825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,1,power_law_1.2,4.037503814697265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,1,power_law_1.2,4.090604782104492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,128,balanced,1.4982186953226726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,128,balanced,1.501706600189209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,128,power_law_1.01,1.6501184463500977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,128,power_law_1.01,1.6615104675292969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,128,power_law_1.2,1.766886329650879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,128,power_law_1.2,1.7865024566650392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,16,balanced,1.641482671101888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,16,balanced,1.6456640561421711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,16,power_law_1.01,1.8892223358154296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,16,power_law_1.01,1.893324851989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,16,power_law_1.2,1.988096046447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,16,power_law_1.2,2.0463743209838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,2,balanced,2.81058661142985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,2,balanced,2.8129599889119468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,2,power_law_1.01,3.00512638092041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,2,power_law_1.01,3.1350656509399415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,2,power_law_1.2,3.0180736541748048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,2,power_law_1.2,3.0497600555419924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,32,balanced,1.5562453269958496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,32,balanced,1.564784049987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,32,power_law_1.01,1.7450624465942384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,32,power_law_1.01,1.7623935699462892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,32,power_law_1.2,1.8342208862304688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,32,power_law_1.2,1.8817024230957031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,4,balanced,2.1436479886372886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,4,balanced,2.1476319630940757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,4,power_law_1.01,2.316985511779785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,4,power_law_1.01,2.3966144561767577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,4,power_law_1.2,2.39737606048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,4,power_law_1.2,2.4376384735107424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,64,balanced,1.518229325612386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,64,balanced,1.5213120778401692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,64,power_law_1.01,1.676755142211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,64,power_law_1.01,1.7290943145751954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,64,power_law_1.2,1.7799232482910157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,64,power_law_1.2,1.7863359451293945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,8,balanced,1.7994933128356934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,8,balanced,1.8036959966023762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,8,power_law_1.01,1.99420166015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,8,power_law_1.01,2.0425344467163087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,8,power_law_1.2,2.2032384872436523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,1,8,power_law_1.2,2.2388288497924806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,16,1,balanced,1.3768800099690754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,16,1,balanced,1.3809226353963215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,16,1,power_law_1.01,1.4414400100708007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,16,1,power_law_1.01,1.441823959350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,16,1,power_law_1.2,1.4450367927551269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,16,1,power_law_1.2,1.4508543968200684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,2,1,balanced,2.48797337214152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,2,1,balanced,2.554154713948568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,2,1,power_law_1.01,2.6168191909790037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,2,1,power_law_1.01,2.6174911499023437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,2,1,power_law_1.2,2.6429824829101562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,2,1,power_law_1.2,2.6511232376098635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,32,1,balanced,1.3045066992441814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,32,1,balanced,1.3046399752298992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,32,1,power_law_1.01,1.359347152709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,32,1,power_law_1.01,1.3622271537780761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,32,1,power_law_1.2,1.3667263984680176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,32,1,power_law_1.2,1.3736512184143066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,4,1,balanced,1.7893919944763184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,4,1,balanced,1.794282595316569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,4,1,power_law_1.01,1.8791679382324218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,4,1,power_law_1.01,1.8929536819458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,4,1,power_law_1.2,1.8918464660644532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,4,1,power_law_1.2,1.9016447067260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,8,1,balanced,1.5359573364257812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,8,1,balanced,1.5387999216715496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,8,1,power_law_1.01,1.5921664237976074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,8,1,power_law_1.01,1.5970815658569335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,8,1,power_law_1.2,1.603660774230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,1536,8,128,8,1,power_law_1.2,1.609881591796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,1,balanced,19.65618642171224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,1,balanced,20.28011194864909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,1,power_law_1.01,19.906541442871095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,1,power_law_1.01,20.203065490722658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,1,power_law_1.2,19.535923767089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,1,power_law_1.2,19.54589385986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,128,balanced,5.422890981038411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,128,balanced,5.4300587972005205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,128,power_law_1.01,5.667027282714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,128,power_law_1.01,5.708224105834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,128,power_law_1.2,5.8371326446533205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,128,power_law_1.2,5.9495361328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,16,balanced,6.161994934082031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,16,balanced,6.189525604248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,16,power_law_1.01,6.53359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,16,power_law_1.01,6.632729339599609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,16,power_law_1.2,6.8685760498046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,16,power_law_1.2,6.910380554199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,2,balanced,12.518917083740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,2,balanced,12.57525380452474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,2,power_law_1.01,13.288922119140626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,2,power_law_1.01,13.328153991699219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,2,power_law_1.2,13.187142944335937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,2,power_law_1.2,13.229356384277343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,256,balanced,5.3691361745198565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,256,balanced,5.372943878173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,256,power_law_1.01,5.557766342163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,256,power_law_1.01,5.6341503143310545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,256,power_law_1.2,5.752051162719726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,256,power_law_1.2,5.870073699951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,32,balanced,5.728768030802409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,32,balanced,5.764357248942058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,32,power_law_1.01,6.039673614501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,32,power_law_1.01,6.049516677856445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,32,power_law_1.2,6.312838363647461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,32,power_law_1.2,6.487776184082032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,4,balanced,8.577269236246744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,4,balanced,8.58889071146647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,4,power_law_1.01,8.850220489501954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,4,power_law_1.01,9.098016357421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,4,power_law_1.2,9.40597152709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,4,power_law_1.2,9.706553649902343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,64,balanced,5.530991872151692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,64,balanced,5.532480239868164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,64,power_law_1.01,5.83941764831543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,64,power_law_1.01,5.895795059204102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,64,power_law_1.2,6.072256088256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,64,power_law_1.2,6.114003372192383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,8,balanced,7.047178904215495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,8,balanced,7.083386739095052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,8,power_law_1.01,7.3605506896972654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,8,power_law_1.01,7.519257354736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,8,power_law_1.2,7.649043273925781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,1,8,power_law_1.2,7.858918762207031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,16,1,balanced,32.59868876139323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,16,1,balanced,34.720532735188804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,16,1,power_law_1.01,34.911660766601564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,16,1,power_law_1.01,35.176107788085936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,16,1,power_law_1.2,35.001031494140626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,16,1,power_law_1.2,35.81314697265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,2,1,balanced,11.35986073811849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,2,1,balanced,11.404890696207682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,2,1,power_law_1.01,11.52327651977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,2,1,power_law_1.01,11.651321411132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,2,1,power_law_1.2,11.430585479736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,2,1,power_law_1.2,11.650624084472657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,32,1,balanced,23.678436279296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,32,1,balanced,24.075055440266926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,32,1,power_law_1.01,24.366796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,32,1,power_law_1.01,24.42674560546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,32,1,power_law_1.2,24.520658874511717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,32,1,power_law_1.2,24.622592163085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,4,1,balanced,7.124266942342122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,4,1,balanced,7.210746765136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,4,1,power_law_1.01,7.287923431396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,4,1,power_law_1.01,7.315795135498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,4,1,power_law_1.2,7.138079833984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,4,1,power_law_1.2,7.229119873046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,8,1,balanced,5.167824109395345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,8,1,balanced,5.185402552286784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,8,1,power_law_1.01,5.154822540283203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,8,1,power_law_1.01,5.228435134887695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,8,1,power_law_1.2,5.235635375976562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,4096,2688,22,512,8,1,power_law_1.2,5.259999847412109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,1,balanced,12.890122731526693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,1,balanced,13.023136138916016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,1,power_law_1.01,12.603014373779297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,1,power_law_1.01,12.929362487792968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,1,power_law_1.2,12.811386108398438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,1,power_law_1.2,13.129306030273437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,2,balanced,7.247450510660808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,2,balanced,7.278495788574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,2,power_law_1.01,10.759814453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,2,power_law_1.01,9.742380523681641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,2,power_law_1.2,8.497702026367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,2,power_law_1.2,9.371443176269532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,4,balanced,4.532064119974772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,4,balanced,4.5675201416015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,4,power_law_1.01,7.403558349609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,4,power_law_1.01,7.621305847167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,4,power_law_1.2,7.306822204589844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,4,power_law_1.2,9.541395568847657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,8,balanced,3.367520014444987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,8,balanced,3.3764588038126626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,8,power_law_1.01,6.913676452636719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,8,power_law_1.01,7.026943969726562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,8,power_law_1.2,6.856838226318359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,1,8,power_law_1.2,7.276793670654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,16,1,balanced,1.0931946436564128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,16,1,balanced,1.1033973693847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,16,1,power_law_1.01,1.111302375793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,16,1,power_law_1.01,1.1188608169555665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,16,1,power_law_1.2,1.110105609893799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,16,1,power_law_1.2,1.114137554168701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,2,1,balanced,5.9914296468098955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,2,1,balanced,6.052480061848958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,2,1,power_law_1.01,5.928915023803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,2,1,power_law_1.01,6.044915390014649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,2,1,power_law_1.2,5.955174255371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,2,1,power_law_1.2,6.190464019775391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,32,1,balanced,0.8061386744181315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,32,1,balanced,0.8146613438924154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,32,1,power_law_1.01,0.8239935874938965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,32,1,power_law_1.01,0.828115177154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,32,1,power_law_1.2,0.8207807540893555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,32,1,power_law_1.2,0.8240639686584472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,4,1,balanced,3.1107358932495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,4,1,balanced,3.1436745325724282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,4,1,power_law_1.01,3.095897674560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,4,1,power_law_1.01,3.104812812805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,4,1,power_law_1.2,3.0084991455078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,4,1,power_law_1.2,3.123551940917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,8,1,balanced,1.6857439676920574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,8,1,balanced,1.724031925201416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,8,1,power_law_1.01,1.7138879776000977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,8,1,power_law_1.01,1.7418432235717773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,8,1,power_law_1.2,1.7273855209350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,16384,2,8,8,1,power_law_1.2,1.7299583435058594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,1,balanced,7.57591438293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,1,balanced,7.745381037394206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,1,power_law_1.01,8.364339447021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,1,power_law_1.01,8.373811340332031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,1,power_law_1.2,8.459641265869141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,1,power_law_1.2,8.64150390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,128,balanced,2.1338186264038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,128,balanced,2.137615998586019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,128,power_law_1.01,2.323404884338379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,128,power_law_1.01,2.3375167846679688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,128,power_law_1.2,2.4731584548950196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,128,power_law_1.2,2.5010047912597657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,16,balanced,2.4210400581359863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,16,balanced,2.425253391265869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,16,power_law_1.01,2.7368896484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,16,power_law_1.01,2.742399978637695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,16,power_law_1.2,2.8657535552978515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,16,power_law_1.2,2.8983360290527345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,2,balanced,4.792250633239746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,2,balanced,4.86301326751709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,2,power_law_1.01,5.417478561401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,2,power_law_1.01,5.469145584106445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,2,power_law_1.2,5.358720016479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,2,power_law_1.2,5.441209411621093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,256,balanced,2.1133012771606445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,256,balanced,2.113605340321859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,256,power_law_1.01,2.2871679306030273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,256,power_law_1.01,2.2926399230957033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,256,power_law_1.2,2.465331268310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,256,power_law_1.2,2.5037952423095704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,32,balanced,2.2528212865193686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,32,balanced,2.257376035054525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,32,power_law_1.01,2.510553550720215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,32,power_law_1.01,2.5760255813598634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,32,power_law_1.2,2.669638442993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,32,power_law_1.2,2.6961727142333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,4,balanced,3.4249439239501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,4,balanced,3.4499200185139975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,4,power_law_1.01,3.8719551086425783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,4,power_law_1.01,3.9825664520263673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,4,power_law_1.2,3.9509441375732424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,4,power_law_1.2,4.010879898071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,64,balanced,2.175253391265869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,64,balanced,2.184266726175944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,64,power_law_1.01,2.4178112030029295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,64,power_law_1.01,2.4343231201171873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,64,power_law_1.2,2.5390335083007813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,64,power_law_1.2,2.595583915710449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,8,balanced,2.733327865600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,8,balanced,2.7661174138387046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,8,power_law_1.01,3.0235647201538085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,8,power_law_1.01,3.1572992324829103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,8,power_law_1.2,3.189971160888672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,1,8,power_law_1.2,3.4784896850585936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,16,1,balanced,1.9832372665405273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,16,1,balanced,1.9871412913004558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,16,1,power_law_1.01,2.1021055221557616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,16,1,power_law_1.01,2.1033920288085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,16,1,power_law_1.2,2.127097511291504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,16,1,power_law_1.2,2.132659149169922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,2,1,balanced,4.22818660736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,2,1,balanced,4.551674524943034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,2,1,power_law_1.01,4.768838500976562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,2,1,power_law_1.01,4.851692962646484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,2,1,power_law_1.2,4.759468841552734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,2,1,power_law_1.2,4.956076812744141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,32,1,balanced,1.8497120539347331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,32,1,balanced,1.8519093195597331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,32,1,power_law_1.01,1.9519487380981446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,32,1,power_law_1.01,1.9548095703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,32,1,power_law_1.2,1.9705856323242188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,32,1,power_law_1.2,1.975052833557129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,4,1,balanced,2.8956801096598306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,4,1,balanced,2.912416140238444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,4,1,power_law_1.01,3.145248031616211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,4,1,power_law_1.01,3.146348762512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,4,1,power_law_1.2,3.14532470703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,4,1,power_law_1.2,3.1626943588256835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,8,1,balanced,2.2850186030069985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,8,1,balanced,2.2910025914510093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,8,1,power_law_1.01,2.432793617248535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,8,1,power_law_1.01,2.4368383407592775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,8,1,power_law_1.2,2.4572608947753904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2048,8,256,8,1,power_law_1.2,2.4640064239501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,1,balanced,9.242485046386719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,1,balanced,9.493216196695963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,1,power_law_1.01,9.314189147949218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,1,power_law_1.01,9.608678436279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,1,power_law_1.2,9.201670074462891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,1,power_law_1.2,9.374502563476563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,16,balanced,2.6691306432088218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,16,balanced,2.6778294245402017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,16,power_law_1.01,3.1159040451049806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,16,power_law_1.01,3.2044544219970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,16,power_law_1.2,3.2653377532958983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,16,power_law_1.2,3.3801345825195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,2,balanced,5.939770380655925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,2,balanced,5.984479904174805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,2,power_law_1.01,6.317433547973633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,2,power_law_1.01,6.332236862182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,2,power_law_1.2,6.245286560058593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,2,power_law_1.2,6.565190124511719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,32,balanced,2.4556479454040527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,32,balanced,2.4594666163126626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,32,power_law_1.01,2.801247978210449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,32,power_law_1.01,2.8540672302246093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,32,power_law_1.2,3.152998352050781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,32,power_law_1.2,3.1968063354492187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,4,balanced,3.9623839060465493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,4,balanced,3.9768854777018228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,4,power_law_1.01,4.391206359863281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,4,power_law_1.01,4.731059265136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,4,power_law_1.2,4.6180671691894535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,4,power_law_1.2,4.671871948242187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,8,balanced,3.096303939819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,8,balanced,3.097754796346029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,8,power_law_1.01,3.582304000854492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,8,power_law_1.01,3.680179214477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,8,power_law_1.2,3.84730224609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,1,8,power_law_1.2,3.8821441650390627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,16,1,balanced,2.225802739461263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,16,1,balanced,2.228501319885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,16,1,power_law_1.01,2.256377601623535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,16,1,power_law_1.01,2.2565311431884765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,16,1,power_law_1.2,2.2661056518554688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,16,1,power_law_1.2,2.269126319885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,2,1,balanced,5.327066739400228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,2,1,balanced,5.492410659790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,2,1,power_law_1.01,5.147449493408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,2,1,power_law_1.01,5.326367950439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,2,1,power_law_1.2,5.373785781860351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,2,1,power_law_1.2,5.427628707885742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,32,1,balanced,2.026858647664388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,32,1,balanced,2.02947203318278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,32,1,power_law_1.01,2.0528703689575196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,32,1,power_law_1.01,2.0548032760620116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,32,1,power_law_1.2,2.066655921936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,32,1,power_law_1.2,2.0672576904296873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,4,1,balanced,3.3751678466796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,4,1,balanced,3.4629761377970376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,4,1,power_law_1.01,3.430054473876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,4,1,power_law_1.01,3.4313728332519533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,4,1,power_law_1.2,3.427878570556641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,4,1,power_law_1.2,3.4284927368164064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,8,1,balanced,2.537615935007731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,8,1,balanced,2.542448043823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,8,1,power_law_1.01,2.5684991836547852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,8,1,power_law_1.01,2.5808832168579103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,8,1,power_law_1.2,2.591814422607422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,6144,2560,8,160,8,1,power_law_1.2,2.5952320098876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,1,balanced,9.153327941894531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,1,balanced,9.220640182495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,1,power_law_1.01,9.567174530029297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,1,power_law_1.01,9.668978881835937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,1,power_law_1.2,10.130643463134765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,1,power_law_1.2,9.91994857788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,128,balanced,2.342048009236654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,128,balanced,2.350656032562256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,128,power_law_1.01,2.5568511962890623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,128,power_law_1.01,2.5638336181640624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,128,power_law_1.2,2.7285888671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,128,power_law_1.2,2.821824073791504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,16,balanced,2.680789311726888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,16,balanced,2.6828746795654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,16,power_law_1.01,3.0837440490722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,16,power_law_1.01,3.101568031311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,16,power_law_1.2,3.16627197265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,16,power_law_1.2,3.3904064178466795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,2,balanced,5.77723757425944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,2,balanced,5.842389424641927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,2,power_law_1.01,6.131584167480469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,2,power_law_1.01,6.251769638061523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,2,power_law_1.2,6.480345916748047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,2,power_law_1.2,6.759961700439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,256,balanced,2.318042596181234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,256,balanced,2.318138599395752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,256,power_law_1.01,2.4974592208862303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,256,power_law_1.01,2.505107116699219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,256,power_law_1.2,2.7519359588623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,256,power_law_1.2,2.767398452758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,32,balanced,2.4827893575032554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,32,balanced,2.485978603363037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,32,power_law_1.01,2.7510400772094727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,32,power_law_1.01,2.8184768676757814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,32,power_law_1.2,2.9078847885131838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,32,power_law_1.2,3.1138559341430665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,4,balanced,3.865392049153646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,4,balanced,3.893653233846029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,4,power_law_1.01,4.4950721740722654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,4,power_law_1.01,4.546892929077148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,4,power_law_1.2,4.610335922241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,4,power_law_1.2,4.669452667236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,64,balanced,2.386751969655355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,64,balanced,2.398021380106608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,64,power_law_1.01,2.633100891113281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,64,power_law_1.01,2.690995216369629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,64,power_law_1.2,2.8023168563842775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,64,power_law_1.2,2.983206367492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,8,balanced,3.0744053522745767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,8,balanced,3.0769173304239907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,8,power_law_1.01,3.5213504791259767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,8,power_law_1.01,3.5328449249267577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,8,power_law_1.2,3.7147201538085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,1,8,power_law_1.2,3.739244842529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,16,1,balanced,2.2675894101460776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,16,1,balanced,2.269477367401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,16,1,power_law_1.01,2.4012224197387697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,16,1,power_law_1.01,2.4080448150634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,16,1,power_law_1.2,2.4253183364868165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,16,1,power_law_1.2,2.431443214416504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,2,1,balanced,5.159157435099284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,2,1,balanced,5.204954783121745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,2,1,power_law_1.01,5.5172161102294925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,2,1,power_law_1.01,5.559097671508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,2,1,power_law_1.2,5.548255920410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,2,1,power_law_1.2,5.594489669799804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,32,1,balanced,2.1127467155456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,32,1,balanced,2.112933317820231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,32,1,power_law_1.01,2.23370246887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,32,1,power_law_1.01,2.239033508300781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,32,1,power_law_1.2,2.254240036010742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,32,1,power_law_1.2,2.256947135925293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,4,1,balanced,3.313904126485189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,4,1,balanced,3.3416268030802407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,4,1,power_law_1.01,3.6015041351318358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,4,1,power_law_1.01,3.609017562866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,4,1,power_law_1.2,3.6012798309326173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,4,1,power_law_1.2,3.6270336151123046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,8,1,balanced,2.626453399658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,8,1,balanced,2.6268746058146157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,8,1,power_law_1.01,2.7948543548583986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,8,1,power_law_1.01,2.800953674316406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,8,1,power_law_1.2,2.81280632019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,256,8,1,power_law_1.2,2.820812797546387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,1,balanced,10.007786432902018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,1,balanced,9.688704172770182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,1,power_law_1.01,10.720563507080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,1,power_law_1.01,10.852153778076172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,1,power_law_1.2,10.951808166503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,1,power_law_1.2,10.98603515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,128,balanced,2.4069493611653647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,128,balanced,2.407050609588623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,128,power_law_1.01,2.574143981933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,128,power_law_1.01,2.5817535400390623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,128,power_law_1.2,2.719487953186035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,128,power_law_1.2,2.7527999877929688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,16,balanced,2.7962398529052734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,16,balanced,2.8016532262166343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,16,power_law_1.01,3.0872447967529295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,16,power_law_1.01,3.104185676574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,16,power_law_1.2,3.2734912872314452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,16,power_law_1.2,3.3431678771972657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,2,balanced,6.131461461385091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,2,balanced,6.175439834594727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,2,power_law_1.01,6.701446533203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,2,power_law_1.01,6.800640106201172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,2,power_law_1.2,6.9722434997558596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,2,power_law_1.2,6.985081481933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,32,balanced,2.5748106638590493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,32,balanced,2.5759092966715493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,32,power_law_1.01,2.8007360458374024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,32,power_law_1.01,2.8795072555541994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,32,power_law_1.2,2.956582450866699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,32,power_law_1.2,2.985856056213379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,4,balanced,4.192709287007649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,4,balanced,4.207861264546712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,4,power_law_1.01,4.522553634643555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,4,power_law_1.01,4.546918487548828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,4,power_law_1.2,4.749465560913086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,4,power_law_1.2,4.957823944091797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,64,balanced,2.462117354075114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,64,balanced,2.4648586908976235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,64,power_law_1.01,2.6806400299072264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,64,power_law_1.01,2.6844928741455076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,64,power_law_1.2,2.8243200302124025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,64,power_law_1.2,2.870854377746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,8,balanced,3.266106605529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,8,balanced,3.267786661783854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,8,power_law_1.01,3.560927963256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,8,power_law_1.01,3.614771270751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,8,power_law_1.2,3.677939224243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,1,8,power_law_1.2,3.8540096282958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,16,1,balanced,2.4458187421162925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,16,1,balanced,2.4470292727152505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,16,1,power_law_1.01,2.5111040115356444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,16,1,power_law_1.01,2.517651176452637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,16,1,power_law_1.2,2.5574207305908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,16,1,power_law_1.2,2.5574655532836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,2,1,balanced,5.675770441691081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,2,1,balanced,6.039791742960612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,2,1,power_law_1.01,5.983571243286133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,2,1,power_law_1.01,5.998284912109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,2,1,power_law_1.2,6.209478378295898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,2,1,power_law_1.2,6.2153984069824215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,32,1,balanced,2.24347194035848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,32,1,balanced,2.2438133557637534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,32,1,power_law_1.01,2.3336191177368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,32,1,power_law_1.01,2.3367935180664063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,32,1,power_law_1.2,2.361248016357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,32,1,power_law_1.2,2.365715217590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,4,1,balanced,3.6754239400227866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,4,1,balanced,3.7765067418416343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,4,1,power_law_1.01,3.805369567871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,4,1,power_law_1.01,3.9004352569580076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,4,1,power_law_1.2,3.9274559020996094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,4,1,power_law_1.2,3.954528045654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,8,1,balanced,2.867168108622233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,8,1,balanced,2.8717759450276694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,8,1,power_law_1.01,2.9442623138427733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,8,1,power_law_1.01,2.9551679611206056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,8,1,power_law_1.2,2.9901119232177735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,16384,7168,2048,8,384,8,1,power_law_1.2,3.005196762084961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,1,balanced,0.1493333379427592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,1,balanced,0.14961600303649902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,1,power_law_1.01,0.14218239784240722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,1,power_law_1.01,0.14338560104370118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,1,power_law_1.2,0.14204800128936768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,1,power_law_1.2,0.1424191951751709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,128,balanced,0.04994133114814758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,128,balanced,0.05032533407211304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,128,power_law_1.01,0.04885759949684143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,128,power_law_1.01,0.0491456001996994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,128,power_law_1.2,0.04907520115375519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,128,power_law_1.2,0.04943360090255737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,16,balanced,0.051829333106676735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,16,balanced,0.05187733471393585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,16,power_law_1.01,0.050355201959609984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,16,power_law_1.01,0.050758397579193114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,16,power_law_1.2,0.050758397579193114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,16,power_law_1.2,0.05076479911804199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,2,balanced,0.09944533308347066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,2,balanced,0.10019733508427937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,2,power_law_1.01,0.09723520278930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,2,power_law_1.01,0.09822720289230347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,2,power_law_1.2,0.0969983994960785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,2,power_law_1.2,0.09845119714736938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,32,balanced,0.05194666484991709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,32,balanced,0.05198933184146881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,32,power_law_1.01,0.04917120039463043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,32,power_law_1.01,0.04940159916877747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,32,power_law_1.2,0.049619200825691226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,32,power_law_1.2,0.05008000135421753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,4,balanced,0.07688533266385396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,4,balanced,0.0773119976123174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,4,power_law_1.01,0.0738431990146637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,4,power_law_1.01,0.07448319792747497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,4,power_law_1.2,0.07587839961051941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,4,power_law_1.2,0.0766207993030548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,64,balanced,0.04980266590913137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,64,balanced,0.05003199974695841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,64,power_law_1.01,0.047839999198913574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,64,power_law_1.01,0.04873600006103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,64,power_law_1.2,0.049107199907302855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,64,power_law_1.2,0.049446401000022885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,8,balanced,0.056015998125076294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,8,balanced,0.056458666920661926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,8,power_law_1.01,0.054150402545928955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,8,power_law_1.01,0.05605760216712952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,8,power_law_1.2,0.05685120224952698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,1,8,power_law_1.2,0.05726720094680786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,2,1,balanced,0.09817066788673401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,2,1,balanced,0.10009599725405376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,2,1,power_law_1.01,0.0945855975151062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,2,1,power_law_1.01,0.09631360173225403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,2,1,power_law_1.2,0.09658880233764648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,2,1,power_law_1.2,0.0969983994960785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,4,1,balanced,0.07623999814192454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,4,1,balanced,0.07654400169849396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,4,1,power_law_1.01,0.07324159741401673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,4,1,power_law_1.01,0.07420799732208253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,4,1,power_law_1.2,0.0738752007484436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2048,768,8,128,4,1,power_law_1.2,0.07548159956932068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,1,balanced,0.35622398058573407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,1,balanced,0.35753599802652997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,1,power_law_1.01,0.3264960050582886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,1,power_law_1.01,0.3342911958694458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,1,power_law_1.2,0.3412287950515747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,1,power_law_1.2,0.34472320079803465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,128,balanced,0.06649066507816315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,128,balanced,0.06715733309586842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,128,power_law_1.01,0.06615039706230164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,128,power_law_1.01,0.0664255976676941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,128,power_law_1.2,0.06624000072479248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,128,power_law_1.2,0.06632959842681885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,16,balanced,0.07998933394749959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,16,balanced,0.08038400113582611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,16,power_law_1.01,0.07650560140609741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,16,power_law_1.01,0.07694720029830933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,16,power_law_1.2,0.07671679854393006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,16,power_law_1.2,0.07812479734420777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,2,balanced,0.21793067455291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,2,balanced,0.22024534145991007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,2,power_law_1.01,0.19794559478759766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,2,power_law_1.01,0.20339839458465575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,2,power_law_1.2,0.21047039031982423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,2,power_law_1.2,0.21105918884277344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,32,balanced,0.06819733480612437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,32,balanced,0.07025599976380666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,32,power_law_1.01,0.06854400038719177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,32,power_law_1.01,0.06863359808921814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,32,power_law_1.2,0.06913920044898987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,32,power_law_1.2,0.0693120002746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,4,balanced,0.1448319951693217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,4,balanced,0.14623467127482095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,4,power_law_1.01,0.1376512050628662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,4,power_law_1.01,0.14012160301208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,4,power_law_1.2,0.14067840576171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,4,power_law_1.2,0.14161920547485352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,64,balanced,0.06822933256626129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,64,balanced,0.06846400101979573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,64,power_law_1.01,0.06600319743156433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,64,power_law_1.01,0.06678400039672852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,64,power_law_1.2,0.06635519862174988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,64,power_law_1.2,0.06689280271530151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,8,balanced,0.1074720025062561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,8,balanced,0.10806933045387268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,8,power_law_1.01,0.10050560235977173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,8,power_law_1.01,0.10193920135498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,8,power_law_1.2,0.10145920515060425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,1,8,power_law_1.2,0.10450559854507446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,16,1,balanced,0.326800008614858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,16,1,balanced,0.32973867654800415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,16,1,power_law_1.01,0.3014847993850708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,16,1,power_law_1.01,0.3050240039825439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,16,1,power_law_1.2,0.3079744100570679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,16,1,power_law_1.2,0.3121920108795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,2,1,balanced,0.20999467372894287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,2,1,balanced,0.2126880089441935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,2,1,power_law_1.01,0.19585280418395995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,2,1,power_law_1.01,0.19848320484161378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,2,1,power_law_1.2,0.1977280020713806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,2,1,power_law_1.2,0.20259199142456055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,32,1,balanced,0.2814026673634847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,32,1,balanced,0.2834026614824931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,32,1,power_law_1.01,0.2536191940307617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,32,1,power_law_1.01,0.25820159912109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,32,1,power_law_1.2,0.26754560470581057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,32,1,power_law_1.2,0.26829440593719484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,4,1,balanced,0.13844799995422363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,4,1,balanced,0.13940800229708353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,4,1,power_law_1.01,0.12861440181732178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,4,1,power_law_1.01,0.1319615960121155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,4,1,power_law_1.2,0.13023359775543214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,4,1,power_law_1.2,0.13127679824829103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,8,1,balanced,0.4246240059534709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,8,1,balanced,0.42635198434193927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,8,1,power_law_1.01,0.3905087947845459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,8,1,power_law_1.01,0.3933568000793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,8,1,power_law_1.2,0.39779200553894045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,2688,1856,6,128,8,1,power_law_1.2,0.40482559204101565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,1,balanced,0.6076533397038778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,1,balanced,0.6081173419952393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,1,power_law_1.01,0.5138751983642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,1,power_law_1.01,0.5296832084655761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,1,power_law_1.2,0.5239999771118165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,1,power_law_1.2,0.52674560546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,128,balanced,0.09912000099817912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,128,balanced,0.09913067022959392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,128,power_law_1.01,0.09842560291290284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,128,power_law_1.01,0.09857919812202454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,128,power_law_1.2,0.09828479886054993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,128,power_law_1.2,0.09847679734230042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,16,balanced,0.13403200109799704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,16,balanced,0.1343946655591329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,16,power_law_1.01,0.12444159984588624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,16,power_law_1.01,0.12717440128326415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,16,power_law_1.2,0.1233407974243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,16,power_law_1.2,0.12510080337524415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,2,balanced,0.35736000537872314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,2,balanced,0.3583253224690755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,2,power_law_1.01,0.31857919692993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,2,power_law_1.01,0.31994240283966063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,2,power_law_1.2,0.31674880981445314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,2,power_law_1.2,0.3232959985733032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,256,balanced,0.10084799925486247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,256,balanced,0.10090667009353638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,256,power_law_1.01,0.0990015983581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,256,power_law_1.01,0.09941759705543518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,256,power_law_1.2,0.0989247977733612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,256,power_law_1.2,0.09921919703483581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,32,balanced,0.1111253301302592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,32,balanced,0.11137066284815471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,32,power_law_1.01,0.10703999996185302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,32,power_law_1.01,0.10903040170669556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,32,power_law_1.2,0.10823680162429809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,32,power_law_1.2,0.1093951940536499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,4,balanced,0.23247466484705606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,4,balanced,0.23286932706832886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,4,power_law_1.01,0.20419840812683104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,4,power_law_1.01,0.2144831895828247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,4,power_law_1.2,0.21420800685882568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,4,power_law_1.2,0.22111999988555908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,64,balanced,0.1011893351872762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,64,balanced,0.10122666756312053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,64,power_law_1.01,0.10085120201110839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,64,power_law_1.01,0.10120320320129395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,64,power_law_1.2,0.10043519735336304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,64,power_law_1.2,0.10067839622497558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,8,balanced,0.16528000434239706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,8,balanced,0.16667733589808145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,8,power_law_1.01,0.154310405254364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,8,power_law_1.01,0.15567359924316407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,8,power_law_1.2,0.15162880420684816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,1,8,power_law_1.2,0.15689599514007568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,16,1,balanced,0.13385599851608276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,16,1,balanced,0.13570666313171387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,16,1,power_law_1.01,0.1152575969696045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,16,1,power_law_1.01,0.11711360216140747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,16,1,power_law_1.2,0.11699199676513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,16,1,power_law_1.2,0.11758079528808593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,2,1,balanced,0.34119999408721924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,2,1,balanced,0.34187201658884686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,2,1,power_law_1.01,0.30192639827728274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,2,1,power_law_1.01,0.3019392013549805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,2,1,power_law_1.2,0.29601919651031494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,2,1,power_law_1.2,0.3020927906036377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,32,1,balanced,0.11343999703725179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,32,1,balanced,0.11353600025177002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,32,1,power_law_1.01,0.10556800365447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,32,1,power_law_1.01,0.10558719635009765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,32,1,power_law_1.2,0.10437120199203491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,32,1,power_law_1.2,0.1053056001663208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,4,1,balanced,0.21766400337219238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,4,1,balanced,0.2200160026550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,4,1,power_law_1.01,0.18838399648666382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,4,1,power_law_1.01,0.1929471969604492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,4,1,power_law_1.2,0.192684805393219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,4,1,power_law_1.2,0.19342080354690552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,8,1,balanced,0.15773333112398782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,8,1,balanced,0.15780799587567648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,8,1,power_law_1.01,0.14325759410858155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,8,1,power_law_1.01,0.14510719776153563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,8,1,power_law_1.2,0.1444991946220398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,3072,1536,8,256,8,1,power_law_1.2,0.14585599899291993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,1,balanced,0.29013333717981976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,1,balanced,0.2940426667531331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,1,power_law_1.01,0.3263488054275513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,1,power_law_1.01,0.331712007522583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,1,power_law_1.2,0.32334721088409424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,1,power_law_1.2,0.33527040481567383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,2,balanced,0.2055466572443644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,2,balanced,0.20602132876714072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,2,power_law_1.01,0.22734079360961915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,2,power_law_1.01,0.2377023935317993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,2,power_law_1.2,0.22784640789031982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,2,power_law_1.2,0.2318592071533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,4,balanced,0.16431466738382974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,4,balanced,0.16517866651217142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,4,power_law_1.01,0.17958400249481202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,4,power_law_1.01,0.1840000033378601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,4,power_law_1.2,0.18182400465011597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,4,power_law_1.2,0.1878399968147278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,8,balanced,0.14755733807881674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,8,balanced,0.14784000317255655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,8,power_law_1.01,0.15800960063934327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,8,power_law_1.01,0.15892479419708253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,8,power_law_1.2,0.15681920051574708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,1,8,power_law_1.2,0.15984640121459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,16,1,balanced,0.05193600058555603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,16,1,balanced,0.05194133520126343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,16,1,power_law_1.01,0.05619199872016907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,16,1,power_law_1.01,0.05730559825897217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,16,1,power_law_1.2,0.05504000186920166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,16,1,power_law_1.2,0.0574400007724762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,2,1,balanced,0.17018133401870728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,2,1,balanced,0.17226133743921915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,2,1,power_law_1.01,0.17267839908599852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,2,1,power_law_1.01,0.17537920475006102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,2,1,power_law_1.2,0.17857919931411742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,2,1,power_law_1.2,0.18047360181808472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,32,1,balanced,0.04110399881998698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,32,1,balanced,0.041365332901477814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,32,1,power_law_1.01,0.041465601325035094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,32,1,power_law_1.01,0.04147840142250061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,32,1,power_law_1.2,0.04168959856033325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,32,1,power_law_1.2,0.04226559996604919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,4,1,balanced,0.10894933342933655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,4,1,balanced,0.10950400431950887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,4,1,power_law_1.01,0.1085055947303772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,4,1,power_law_1.01,0.10944000482559205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,4,1,power_law_1.2,0.10855679512023926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,4,1,power_law_1.2,0.10884480476379395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,8,1,balanced,0.07226666808128357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,8,1,balanced,0.07419200241565704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,8,1,power_law_1.01,0.07095680236816407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,8,1,power_law_1.01,0.0718720018863678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,8,1,power_law_1.2,0.07086719870567322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,14336,2,8,8,1,power_law_1.2,0.07119359970092773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,1,balanced,0.42604267597198486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,1,balanced,0.4273013273874919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,1,power_law_1.01,0.4122176170349121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,1,power_law_1.01,0.4133632183074951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,1,power_law_1.2,0.4160639762878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,1,power_law_1.2,0.41948161125183103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,128,balanced,0.07853866616884868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,128,balanced,0.07893333335717519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,128,power_law_1.01,0.07701119780540466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,128,power_law_1.01,0.0774399995803833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,128,power_law_1.2,0.07761920094490052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,128,power_law_1.2,0.0779583990573883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,16,balanced,0.09345066547393799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,16,balanced,0.09346666932106018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,16,power_law_1.01,0.09136000275611877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,16,power_law_1.01,0.09175040125846863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,16,power_law_1.2,0.09264640212059021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,16,power_law_1.2,0.09365760087966919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,2,balanced,0.25564799706141156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,2,balanced,0.25758399566014606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,2,power_law_1.01,0.2506752014160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,2,power_law_1.01,0.2517568111419678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,2,power_law_1.2,0.24827520847320556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,2,power_law_1.2,0.2539263963699341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,32,balanced,0.08250666658083598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,32,balanced,0.08458133538564046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,32,power_law_1.01,0.08255360126495362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,32,power_law_1.01,0.08366079926490784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,32,power_law_1.2,0.08204799890518188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,32,power_law_1.2,0.08365439772605895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,4,balanced,0.16404267152150473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,4,balanced,0.16449066996574402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,4,power_law_1.01,0.16053760051727295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,4,power_law_1.01,0.16167039871215821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,4,power_law_1.2,0.1613759994506836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,4,power_law_1.2,0.16176639795303344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,64,balanced,0.0783679982026418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,64,balanced,0.07839466631412506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,64,power_law_1.01,0.07750399708747864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,64,power_law_1.01,0.07779840230941773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,64,power_law_1.2,0.0784063994884491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,64,power_law_1.2,0.07850880026817322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,8,balanced,0.12277866403261821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,8,balanced,0.12335999806722005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,8,power_law_1.01,0.1212928056716919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,8,power_law_1.01,0.12166399955749511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,8,power_law_1.2,0.1207808017730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,1,8,power_law_1.2,0.12329599857330323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,16,1,balanced,0.10195199648539226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,16,1,balanced,0.10214400291442871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,16,1,power_law_1.01,0.09987840056419373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,16,1,power_law_1.01,0.10008959770202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,16,1,power_law_1.2,0.10030080080032348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,16,1,power_law_1.2,0.10202239751815796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,2,1,balanced,0.24712000290552774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,2,1,balanced,0.2500586708386739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,2,1,power_law_1.01,0.2406399965286255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,2,1,power_law_1.01,0.24196479320526124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,2,1,power_law_1.2,0.23975040912628173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,2,1,power_law_1.2,0.24048640727996826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,32,1,balanced,0.09175466497739156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,32,1,balanced,0.09368000427881877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,32,1,power_law_1.01,0.08970879912376403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,32,1,power_law_1.01,0.09000959992408752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,32,1,power_law_1.2,0.09059839844703674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,32,1,power_law_1.2,0.09182720184326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,4,1,balanced,0.15901866555213928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,4,1,balanced,0.1609119971593221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,4,1,power_law_1.01,0.15370240211486816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,4,1,power_law_1.01,0.1539520025253296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,4,1,power_law_1.2,0.15562880039215088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,4,1,power_law_1.2,0.15688960552215575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,8,1,balanced,0.11898133158683777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,8,1,balanced,0.12111467123031616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,8,1,power_law_1.01,0.11626240015029907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,8,1,power_law_1.01,0.11737600564956666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,8,1,power_law_1.2,0.11783039569854736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,1536,8,128,8,1,power_law_1.2,0.11870720386505126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,1,balanced,2.686885197957357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,1,balanced,2.6924959818522134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,1,power_law_1.01,2.4441919326782227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,1,power_law_1.01,2.467238426208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,1,power_law_1.2,2.505740737915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,1,power_law_1.2,2.530643272399902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,128,balanced,0.29334932565689087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,128,balanced,0.29345067342122394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,128,power_law_1.01,0.2912447929382324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,128,power_law_1.01,0.29155840873718264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,128,power_law_1.2,0.28998401165008547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,128,power_law_1.2,0.2926016092300415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,16,balanced,0.4529973268508911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,16,balanced,0.4533066749572754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,16,power_law_1.01,0.43722238540649416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,16,power_law_1.01,0.43824000358581544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,16,power_law_1.2,0.44269437789916993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,16,power_law_1.2,0.44408321380615234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,2,balanced,1.4950879414876301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,2,balanced,1.5012747446695964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,2,power_law_1.01,1.3669055938720702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,2,power_law_1.01,1.3796352386474608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,2,power_law_1.2,1.3936896324157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,2,power_law_1.2,1.4044608116149901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,256,balanced,0.2874613404273987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,256,balanced,0.28945066531499225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,256,power_law_1.01,0.2865855932235718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,256,power_law_1.01,0.2867647886276245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,256,power_law_1.2,0.2860480070114136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,256,power_law_1.2,0.28614399433135984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,32,balanced,0.36609601974487305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,32,balanced,0.36906667550404865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,32,power_law_1.01,0.3612096071243286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,32,power_law_1.01,0.3637183904647827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,32,power_law_1.2,0.3612735986709595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,32,power_law_1.2,0.36627199649810793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,4,balanced,0.9016746679941813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,4,balanced,0.9050079981486002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,4,power_law_1.01,0.8255359649658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,4,power_law_1.01,0.860319995880127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,4,power_law_1.2,0.8518336296081543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,4,power_law_1.2,0.8582207679748535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,64,balanced,0.3144693374633789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,64,balanced,0.3155893286069234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,64,power_law_1.01,0.310918402671814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,64,power_law_1.01,0.31176319122314455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,64,power_law_1.2,0.30719358921051027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,64,power_law_1.2,0.3118527889251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,8,balanced,0.6024479866027832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,8,balanced,0.6045706669489542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,8,power_law_1.01,0.5701759815216064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,8,power_law_1.01,0.5826879978179932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,8,power_law_1.2,0.5772928237915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,1,8,power_law_1.2,0.578764820098877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,16,1,balanced,2.2896374066670737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,16,1,balanced,2.2896906534830728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,16,1,power_law_1.01,2.0448575973510743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,16,1,power_law_1.01,2.0700159072875977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,16,1,power_law_1.2,2.0796159744262694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,16,1,power_law_1.2,2.1328128814697265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,2,1,balanced,1.4050933519999187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,2,1,balanced,1.4467573165893555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,2,1,power_law_1.01,1.2611136436462402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,2,1,power_law_1.01,1.2725055694580079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,2,1,power_law_1.2,1.2921792030334474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,2,1,power_law_1.2,1.302348804473877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,32,1,balanced,1.7743412653605144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,32,1,balanced,1.7790719668070476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,32,1,power_law_1.01,1.6108352661132812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,32,1,power_law_1.01,1.6188928604125976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,32,1,power_law_1.2,1.6513984680175782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,32,1,power_law_1.2,1.6559551239013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,4,1,balanced,0.8011946678161621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,4,1,balanced,0.8030453523000082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,4,1,power_law_1.01,0.727948808670044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,4,1,power_law_1.01,0.7333248138427735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,4,1,power_law_1.2,0.747705602645874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,4,1,power_law_1.2,0.7503935813903808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,8,1,balanced,0.5003999869028727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,8,1,balanced,0.5011946757634481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,8,1,power_law_1.01,0.4633471965789795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,8,1,power_law_1.01,0.46959362030029295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,8,1,power_law_1.2,0.46990718841552737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,4096,2688,22,512,8,1,power_law_1.2,0.4726719856262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,1,balanced,0.4370559851328532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,1,balanced,0.4389280080795288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,1,power_law_1.01,0.5316736221313476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,1,power_law_1.01,0.5523839950561523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,1,power_law_1.2,0.5445759773254395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,1,power_law_1.2,0.5619584083557129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,2,balanced,0.28377066055933636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,2,balanced,0.28563199440638226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,2,power_law_1.01,0.32286720275878905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,2,power_law_1.01,0.32731521129608154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,2,power_law_1.2,0.33386878967285155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,2,power_law_1.2,0.3420736074447632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,4,balanced,0.21183466911315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,4,balanced,0.21210134029388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,4,power_law_1.01,0.2355072021484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,4,power_law_1.01,0.2401279926300049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,4,power_law_1.2,0.237990403175354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,4,power_law_1.2,0.25063679218292234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,8,balanced,0.17868266503016153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,8,balanced,0.18242132663726807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,8,power_law_1.01,0.19600640535354613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,8,power_law_1.01,0.19604480266571045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,8,power_law_1.2,0.19196159839630128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,1,8,power_law_1.2,0.19909119606018066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,16,1,balanced,0.0747573326031367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,16,1,balanced,0.08055466910203297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,16,1,power_law_1.01,0.07991679906845092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,16,1,power_law_1.01,0.08000640273094177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,16,1,power_law_1.2,0.0790336012840271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,16,1,power_law_1.2,0.07927680015563965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,2,1,balanced,0.25273066759109497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,2,1,balanced,0.25278399387995404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,2,1,power_law_1.01,0.27705600261688235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,2,1,power_law_1.01,0.29303679466247556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,2,1,power_law_1.2,0.2867840051651001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,2,1,power_law_1.2,0.2945215940475464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,32,1,balanced,0.05614933371543884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,32,1,balanced,0.05813866853713989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,32,1,power_law_1.01,0.06542080044746398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,32,1,power_law_1.01,0.06595839858055115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,32,1,power_law_1.2,0.06255360245704651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,32,1,power_law_1.2,0.06276479959487916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,4,1,balanced,0.15172266960144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,4,1,balanced,0.15499732891718546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,4,1,power_law_1.01,0.1614143967628479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,4,1,power_law_1.01,0.16467200517654418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,4,1,power_law_1.2,0.16300159692764282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,4,1,power_law_1.2,0.16328959465026854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,8,1,balanced,0.09620267152786255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,8,1,balanced,0.0976693332195282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,8,1,power_law_1.01,0.09921919703483581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,8,1,power_law_1.01,0.10020480155944825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,8,1,power_law_1.2,0.09954559803009033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,16384,2,8,8,1,power_law_1.2,0.10099200010299683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,1,balanced,1.5515252749125164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,1,balanced,1.5703253746032715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,1,power_law_1.01,1.3232064247131348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,1,power_law_1.01,1.3346303939819335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,1,power_law_1.2,1.3329792022705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,1,power_law_1.2,1.3631168365478517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,128,balanced,0.1581439971923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,128,balanced,0.1585653324921926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,128,power_law_1.01,0.15571199655532836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,128,power_law_1.01,0.15605759620666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,128,power_law_1.2,0.15597440004348756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,128,power_law_1.2,0.15633280277252198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,16,balanced,0.2446133295694987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,16,balanced,0.24470933278401694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,16,power_law_1.01,0.2407680034637451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,16,power_law_1.01,0.24226560592651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,16,power_law_1.2,0.22721281051635742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,16,power_law_1.2,0.2295936107635498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,2,balanced,0.860426664352417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,2,balanced,0.8634773095448812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,2,power_law_1.01,0.7308991909027099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,2,power_law_1.01,0.7596928119659424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,2,power_law_1.2,0.7445184230804444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,2,power_law_1.2,0.7744703769683838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,256,balanced,0.1541920006275177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,256,balanced,0.15432000160217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,256,power_law_1.01,0.15238399505615235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,256,power_law_1.01,0.15293439626693725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,256,power_law_1.2,0.15247360467910767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,256,power_law_1.2,0.15448960065841674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,32,balanced,0.18547733624776205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,32,balanced,0.18698134024937949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,32,power_law_1.01,0.17761919498443604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,32,power_law_1.01,0.1847808003425598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,32,power_law_1.2,0.17867519855499267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,32,power_law_1.2,0.17893760204315184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,4,balanced,0.503104011217753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,4,balanced,0.5053226550420126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,4,power_law_1.01,0.45240960121154783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,4,power_law_1.01,0.46869120597839353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,4,power_law_1.2,0.46379518508911133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,4,power_law_1.2,0.4675903797149658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,64,balanced,0.16245333353678384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,64,balanced,0.16474133729934692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,64,power_law_1.01,0.16097919940948485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,64,power_law_1.01,0.161190402507782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,64,power_law_1.2,0.16072319746017455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,64,power_law_1.2,0.16090240478515624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,8,balanced,0.33083200454711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,8,balanced,0.332586665948232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,8,power_law_1.01,0.3060096025466919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,8,power_law_1.01,0.31855359077453616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,8,power_law_1.2,0.2955008029937744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,1,8,power_law_1.2,0.30030720233917235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,16,1,balanced,0.24460800488789877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,16,1,balanced,0.24648000796635947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,16,1,power_law_1.01,0.2092672109603882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,16,1,power_law_1.01,0.21269121170043945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,16,1,power_law_1.2,0.21066880226135254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,16,1,power_law_1.2,0.21328001022338866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,2,1,balanced,0.8119093577067057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,2,1,balanced,0.8167306582132975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,2,1,power_law_1.01,0.7085440158843994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,2,1,power_law_1.01,0.7100160121917725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,2,1,power_law_1.2,0.7011839866638183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,2,1,power_law_1.2,0.70796799659729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,32,1,balanced,0.20373332500457764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,32,1,balanced,0.20376000801722208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,32,1,power_law_1.01,0.18915200233459473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,32,1,power_law_1.01,0.19056639671325684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,32,1,power_law_1.2,0.18984320163726806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,32,1,power_law_1.2,0.1912511944770813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,4,1,balanced,0.4702719847361247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,4,1,balanced,0.4707039992014567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,4,1,power_law_1.01,0.41603841781616213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,4,1,power_law_1.01,0.4163968086242676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,4,1,power_law_1.2,0.4204864025115967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,4,1,power_law_1.2,0.4260608196258545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,8,1,balanced,0.3166933258374532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,8,1,balanced,0.3171253403027852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,8,1,power_law_1.01,0.2710335969924927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,8,1,power_law_1.01,0.2711679935455322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,8,1,power_law_1.2,0.2777600049972534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2048,8,256,8,1,power_law_1.2,0.28487679958343504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,1,balanced,1.2257440090179443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,1,balanced,1.2360426584879558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,1,power_law_1.01,1.126963233947754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,1,power_law_1.01,1.133407974243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,1,power_law_1.2,1.1533632278442383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,1,power_law_1.2,1.1623359680175782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,16,balanced,0.19756799936294556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,16,balanced,0.19858133792877197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,16,power_law_1.01,0.1914944052696228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,16,power_law_1.01,0.1955072045326233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,16,power_law_1.2,0.183078396320343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,16,power_law_1.2,0.19872000217437744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,2,balanced,0.6726240317026774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,2,balanced,0.6726453304290771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,2,power_law_1.01,0.6304704189300537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,2,power_law_1.01,0.6403903961181641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,2,power_law_1.2,0.6425407886505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,2,power_law_1.2,0.6533696174621582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,32,balanced,0.14070399602254233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,32,balanced,0.14241066575050354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,32,power_law_1.01,0.1390720009803772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,32,power_law_1.01,0.14044159650802612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,32,power_law_1.2,0.1397055983543396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,32,power_law_1.2,0.14012800455093383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,4,balanced,0.4004266659418742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,4,balanced,0.40141868591308594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,4,power_law_1.01,0.37519359588623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,4,power_law_1.01,0.38188159465789795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,4,power_law_1.2,0.38511359691619873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,4,power_law_1.2,0.3923007965087891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,8,balanced,0.26453866561253864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,8,balanced,0.264789342880249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,8,power_law_1.01,0.24775679111480714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,8,power_law_1.01,0.25735039710998536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,8,power_law_1.2,0.25017600059509276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,1,8,power_law_1.2,0.26083199977874755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,16,1,balanced,0.20097066958745322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,16,1,balanced,0.20193066199620566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,16,1,power_law_1.01,0.17361279726028442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,16,1,power_law_1.01,0.1772480010986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,16,1,power_law_1.2,0.18255360126495362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,16,1,power_law_1.2,0.19107199907302858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,2,1,balanced,0.6535893281300863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,2,1,balanced,0.6585599978764852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,2,1,power_law_1.01,0.5980031967163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,2,1,power_law_1.01,0.6098048210144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,2,1,power_law_1.2,0.618291187286377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,2,1,power_law_1.2,0.6231040000915528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,32,1,balanced,0.1585760017236074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,32,1,balanced,0.15927466750144958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,32,1,power_law_1.01,0.15140479803085327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,32,1,power_law_1.01,0.15235840082168578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,32,1,power_law_1.2,0.15308159589767456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,32,1,power_law_1.2,0.1543936014175415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,4,1,balanced,0.3738613526026408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,4,1,balanced,0.37437868118286133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,4,1,power_law_1.01,0.35323519706726075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,4,1,power_law_1.01,0.3586751937866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,4,1,power_law_1.2,0.36072959899902346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,4,1,power_law_1.2,0.3645375967025757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,8,1,balanced,0.2408426602681478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,8,1,balanced,0.24084800481796265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,8,1,power_law_1.01,0.22927360534667968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,8,1,power_law_1.01,0.23036160469055175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,8,1,power_law_1.2,0.232857608795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,6144,2560,8,160,8,1,power_law_1.2,0.23454720973968507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,1,balanced,1.8008960088094075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,1,balanced,1.8025973637898762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,1,power_law_1.01,1.5298879623413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,1,power_law_1.01,1.5374272346496582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,1,power_law_1.2,1.5738368034362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,1,power_law_1.2,1.579423999786377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,128,balanced,0.17230399449666342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,128,balanced,0.17277334133783975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,128,power_law_1.01,0.16992640495300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,128,power_law_1.01,0.1705024003982544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,128,power_law_1.2,0.17088639736175537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,128,power_law_1.2,0.17114880084991455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,16,balanced,0.27928000688552856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,16,balanced,0.28097599744796753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,16,power_law_1.01,0.26124799251556396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,16,power_law_1.01,0.26727681159973143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,16,power_law_1.2,0.2644736051559448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,16,power_law_1.2,0.2710911989212036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,2,balanced,0.9856320222218832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,2,balanced,0.9920266469319662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,2,power_law_1.01,0.8557951927185059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,2,power_law_1.01,0.8850751876831054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,2,power_law_1.2,0.8697919845581055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,2,power_law_1.2,0.8824383735656738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,256,balanced,0.16874132553736368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,256,balanced,0.1697653333346049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,256,power_law_1.01,0.16695040464401245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,256,power_law_1.01,0.16743040084838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,256,power_law_1.2,0.16625920534133912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,256,power_law_1.2,0.1697216033935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,32,balanced,0.2100320061047872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,32,balanced,0.21161067485809326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,32,power_law_1.01,0.20365440845489502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,32,power_law_1.01,0.20599040985107422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,32,power_law_1.2,0.19854719638824464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,32,power_law_1.2,0.2035775899887085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,4,balanced,0.5771413246790568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,4,balanced,0.5800640185674032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,4,power_law_1.01,0.5160895824432373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,4,power_law_1.01,0.5183231830596924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,4,power_law_1.2,0.5123519897460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,4,power_law_1.2,0.5376128196716309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,64,balanced,0.17824532588322958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,64,balanced,0.1787466605504354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,64,power_law_1.01,0.17562240362167358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,64,power_law_1.01,0.17638399600982665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,64,power_law_1.2,0.17582080364227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,64,power_law_1.2,0.17663999795913696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,8,balanced,0.3785546620686849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,8,balanced,0.3837120135625203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,8,power_law_1.01,0.350547194480896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,8,power_law_1.01,0.35818240642547605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,8,power_law_1.2,0.35255041122436526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,1,8,power_law_1.2,0.3540800094604492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,16,1,balanced,0.2815999984741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,16,1,balanced,0.2830880085627238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,16,1,power_law_1.01,0.24014079570770264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,16,1,power_law_1.01,0.24519040584564208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,16,1,power_law_1.2,0.2395967960357666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,16,1,power_law_1.2,0.24664320945739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,2,1,balanced,0.9474133650461832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,2,1,balanced,0.9737866719563802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,2,1,power_law_1.01,0.8113727569580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,2,1,power_law_1.01,0.8199359893798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,2,1,power_law_1.2,0.8114175796508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,2,1,power_law_1.2,0.8349696159362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,32,1,balanced,0.23221333821614584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,32,1,balanced,0.233024001121521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,32,1,power_law_1.01,0.21685121059417725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,32,1,power_law_1.01,0.21835520267486572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,32,1,power_law_1.2,0.21537280082702637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,32,1,power_law_1.2,0.21882240772247313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,4,1,balanced,0.5450239976247152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,4,1,balanced,0.5463360150655111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,4,1,power_law_1.01,0.48024959564208985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,4,1,power_law_1.01,0.4844031810760498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,4,1,power_law_1.2,0.47950081825256347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,4,1,power_law_1.2,0.491974401473999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,8,1,balanced,0.36655465761820477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,8,1,balanced,0.36849598089853924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,8,1,power_law_1.01,0.3153023958206177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,8,1,power_law_1.01,0.3197887897491455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,8,1,power_law_1.2,0.3184000015258789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,256,8,1,power_law_1.2,0.3321471929550171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,1,balanced,2.760197321573893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,1,balanced,2.7631734212239585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,1,power_law_1.01,2.0951488494873045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,1,power_law_1.01,2.1327999114990233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,1,power_law_1.2,2.0975872039794923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,1,power_law_1.2,2.104550361633301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,128,balanced,0.23166932662328085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,128,balanced,0.2320586641629537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,128,power_law_1.01,0.229369592666626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,128,power_law_1.01,0.22938880920410157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,128,power_law_1.2,0.22933759689331054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,128,power_law_1.2,0.22952959537506104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,16,balanced,0.37615466117858887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,16,balanced,0.3763360182444255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,16,power_law_1.01,0.3462464094161987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,16,power_law_1.01,0.365996789932251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,16,power_law_1.2,0.3456000089645386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,16,power_law_1.2,0.3471168041229248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,2,balanced,1.4516639709472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,2,balanced,1.4738507270812988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,2,power_law_1.01,1.149120044708252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,2,power_law_1.01,1.2072064399719238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,2,power_law_1.2,1.146611213684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,2,power_law_1.2,1.2091391563415528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,32,balanced,0.29647467533747357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,32,balanced,0.2974933385848999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,32,power_law_1.01,0.28231039047241213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,32,power_law_1.01,0.2852031946182251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,32,power_law_1.2,0.27489280700683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,32,power_law_1.2,0.2848448038101196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,4,balanced,0.8361066977183024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,4,balanced,0.8365493615468343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,4,power_law_1.01,0.701036787033081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,4,power_law_1.01,0.7122111797332764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,4,power_law_1.2,0.697279977798462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,4,power_law_1.2,0.7481919765472412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,64,balanced,0.2455893357594808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,64,balanced,0.24822932481765747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,64,power_law_1.01,0.24316799640655518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,64,power_law_1.01,0.24439680576324463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,64,power_law_1.2,0.24168319702148439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,64,power_law_1.2,0.24528000354766846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,8,balanced,0.5336106618245443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,8,balanced,0.534005324045817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,8,power_law_1.01,0.46735358238220215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,8,power_law_1.01,0.47827839851379395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,8,power_law_1.2,0.4569215774536133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,1,8,power_law_1.2,0.4725183963775635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,16,1,balanced,0.3741066853205363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,16,1,balanced,0.3742826779683431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,16,1,power_law_1.01,0.3340543985366821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,16,1,power_law_1.01,0.33457920551300047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,16,1,power_law_1.2,0.33272318840026854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,16,1,power_law_1.2,0.33556480407714845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,2,1,balanced,1.3671414057413738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,2,1,balanced,1.409861405690511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,2,1,power_law_1.01,1.0936511993408202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,2,1,power_law_1.01,1.1012288093566895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,2,1,power_law_1.2,1.0798784255981446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,2,1,power_law_1.2,1.0949631690979005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,32,1,balanced,0.31914667288462323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,32,1,balanced,0.319541335105896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,32,1,power_law_1.01,0.2858367919921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,32,1,power_law_1.01,0.2862272024154663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,32,1,power_law_1.2,0.27964799404144286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,32,1,power_law_1.2,0.28095359802246095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,4,1,balanced,0.7803466320037842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,4,1,balanced,0.7812373638153076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,4,1,power_law_1.01,0.6412864208221436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,4,1,power_law_1.01,0.6486080169677735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,4,1,power_law_1.2,0.6342463970184327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,4,1,power_law_1.2,0.6456704139709473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,8,1,balanced,0.5105760097503662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,8,1,balanced,0.5120693445205688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,8,1,power_law_1.01,0.4296256065368652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,8,1,power_law_1.01,0.4303743839263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,8,1,power_law_1.2,0.4229887962341309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,192,7168,2048,8,384,8,1,power_law_1.2,0.42969598770141604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,1,balanced,0.03161066770553589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,1,balanced,0.034490667283535004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,1,power_law_1.01,0.03212159872055054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,1,power_law_1.01,0.032416000962257385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,1,power_law_1.2,0.032627201080322264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,1,power_law_1.2,0.033843201398849485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,128,balanced,0.02736533433198929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,128,balanced,0.02773333340883255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,128,power_law_1.01,0.026764801144599913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,128,power_law_1.01,0.02682879865169525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,128,power_law_1.2,0.026316800713539125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,128,power_law_1.2,0.026598399877548216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,16,balanced,0.02740799884001414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,16,balanced,0.027461332579453785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,16,power_law_1.01,0.030777600407600404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,16,power_law_1.01,0.03086079955101013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,16,power_law_1.2,0.02961919903755188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,16,power_law_1.2,0.030060800909996032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,2,balanced,0.03145600110292435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,2,balanced,0.03158933420976003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,2,power_law_1.01,0.03552640080451965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,2,power_law_1.01,0.03644160032272339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,2,power_law_1.2,0.0355648010969162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,2,power_law_1.2,0.03559040129184723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,32,balanced,0.027503999571005504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,32,balanced,0.029167999823888142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,32,power_law_1.01,0.02757120132446289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,32,power_law_1.01,0.027692800760269164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,32,power_law_1.2,0.028358399868011475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,32,power_law_1.2,0.02839039862155914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,4,balanced,0.029146666328112285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,4,balanced,0.02938133229811986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,4,power_law_1.01,0.03335680067539215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,4,power_law_1.01,0.0345984011888504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,4,power_law_1.2,0.03164800107479095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,4,power_law_1.2,0.032467201352119446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,64,balanced,0.02741866558790207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,64,balanced,0.027445333699385326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,64,power_law_1.01,0.026451200246810913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,64,power_law_1.01,0.027059200406074523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,64,power_law_1.2,0.027014398574829103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,64,power_law_1.2,0.027321600914001466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,8,balanced,0.02739733209212621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,8,balanced,0.02951466788848241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,8,power_law_1.01,0.030854400992393494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,8,power_law_1.01,0.030880001187324525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,8,power_law_1.2,0.02975359857082367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,1,8,power_law_1.2,0.03128319978713989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,2,1,balanced,0.02621866762638092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,2,1,balanced,0.027402666707833607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,2,1,power_law_1.01,0.026739200949668883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,2,1,power_law_1.01,0.027398398518562316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,2,1,power_law_1.2,0.026739200949668883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,2,1,power_law_1.2,0.027398398518562316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,4,1,balanced,0.02310933421055476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,4,1,balanced,0.025205334027608235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,4,1,power_law_1.01,0.023475199937820435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,4,1,power_law_1.01,0.023737600445747374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,4,1,power_law_1.2,0.02252800017595291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2048,768,8,128,4,1,power_law_1.2,0.0236735999584198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,1,balanced,0.05402666827042898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,1,balanced,0.05513066550095876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,1,power_law_1.01,0.05172479748725891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,1,power_law_1.01,0.05203840136528015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,1,power_law_1.2,0.05261440277099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,1,power_law_1.2,0.05284479856491089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,128,balanced,0.0315786674618721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,128,balanced,0.03344533344109853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,128,power_law_1.01,0.03059839904308319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,128,power_law_1.01,0.030847999453544616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,128,power_law_1.2,0.030675199627876282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,128,power_law_1.2,0.031071999669075014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,16,balanced,0.03143999973932902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,16,balanced,0.031770666440327965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,16,power_law_1.01,0.04826239943504333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,16,power_law_1.01,0.050220799446105954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,16,power_law_1.2,0.04870400130748749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,16,power_law_1.2,0.04987519979476929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,2,balanced,0.043151999513308205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,2,balanced,0.04602666695912679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,2,power_law_1.01,0.05615360140800476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,2,power_law_1.01,0.05852800011634827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,2,power_law_1.2,0.05422080159187317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,2,power_law_1.2,0.05629439949989319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,32,balanced,0.03158933420976003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,32,balanced,0.033301333586374916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,32,power_law_1.01,0.0347135990858078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,32,power_law_1.01,0.035519999265670774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,32,power_law_1.2,0.03530240058898926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,32,power_law_1.2,0.03535360097885132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,4,balanced,0.036501333117485046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,4,balanced,0.03735466549793879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,4,power_law_1.01,0.057055997848510745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,4,power_law_1.01,0.057094401121139525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,4,power_law_1.2,0.04859519898891449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,4,power_law_1.2,0.05189120173454285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,64,balanced,0.031541332602500916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,64,balanced,0.033530667424201965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,64,power_law_1.01,0.03235200047492981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,64,power_law_1.01,0.032915198802948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,64,power_law_1.2,0.03283199965953827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,64,power_law_1.2,0.03351039886474609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,8,balanced,0.03352533280849457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,8,balanced,0.03543466577927271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,8,power_law_1.01,0.05553920269012451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,8,power_law_1.01,0.05737599730491638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,8,power_law_1.2,0.049804800748825075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,1,8,power_law_1.2,0.050367999076843264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,16,1,balanced,0.03942399968703588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,16,1,balanced,0.039861333866914116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,16,1,power_law_1.01,0.03758719861507416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,16,1,power_law_1.01,0.037939199805259706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,16,1,power_law_1.2,0.03790720105171204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,16,1,power_law_1.2,0.0379584014415741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,2,1,balanced,0.03664000084002813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,2,1,balanced,0.037765334049860634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,2,1,power_law_1.01,0.03551360070705414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,2,1,power_law_1.01,0.036959999799728395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,2,1,power_law_1.2,0.03733760118484497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,2,1,power_law_1.2,0.0377920001745224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,32,1,balanced,0.03825599948565165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,32,1,balanced,0.03961600114901861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,32,1,power_law_1.01,0.037503999471664426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,32,1,power_law_1.01,0.03772799968719483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,32,1,power_law_1.2,0.03692800104618073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,32,1,power_law_1.2,0.03823359906673431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,4,1,balanced,0.02957333376010259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,4,1,balanced,0.030239999294281006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,4,1,power_law_1.01,0.02773120105266571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,4,1,power_law_1.01,0.02810879945755005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,4,1,power_law_1.2,0.029420799016952513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,4,1,power_law_1.2,0.02996479868888855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,8,1,balanced,0.04186133543650309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,8,1,balanced,0.04322666426499685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,8,1,power_law_1.01,0.0403903990983963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,8,1,power_law_1.01,0.040575999021530154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,8,1,power_law_1.2,0.041388800740242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,2688,1856,6,128,8,1,power_law_1.2,0.04209280014038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,1,balanced,0.06382933259010315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,1,balanced,0.07835733393828075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,1,power_law_1.01,0.06166399717330932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,1,power_law_1.01,0.06219519972801209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,1,power_law_1.2,0.06295040249824524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,1,power_law_1.2,0.06388480067253113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,128,balanced,0.03194666653871536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,128,balanced,0.033359999457995095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,128,power_law_1.01,0.03020159900188446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,128,power_law_1.01,0.030316799879074097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,128,power_law_1.2,0.030054399371147157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,128,power_law_1.2,0.030937600135803222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,16,balanced,0.031541332602500916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,16,balanced,0.03162133445342382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,16,power_law_1.01,0.06719359755516052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,16,power_law_1.01,0.06935039758682252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,16,power_law_1.2,0.06892799735069274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,16,power_law_1.2,0.06952319741249084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,2,balanced,0.05570133527119955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,2,balanced,0.056015998125076294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,2,power_law_1.01,0.06787199974060058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,2,power_law_1.01,0.07131519913673401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,2,power_law_1.2,0.0648256003856659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,2,power_law_1.2,0.06895999908447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,256,balanced,0.030618667602539062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,256,balanced,0.0332640012105306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,256,power_law_1.01,0.030297601222991945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,256,power_law_1.01,0.03041279911994934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,256,power_law_1.2,0.02998400032520294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,32,balanced,0.03162666658560435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,32,balanced,0.031727999448776245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,32,power_law_1.01,0.05139200091361999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,32,power_law_1.01,0.051667201519012454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,32,power_law_1.2,0.05025920271873474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,32,power_law_1.2,0.051692801713943484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,4,balanced,0.037658666570981346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,4,balanced,0.03790933390458425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,4,power_law_1.01,0.06811519861221313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,4,power_law_1.01,0.0692351996898651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,4,power_law_1.2,0.06624000072479248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,4,power_law_1.2,0.0664255976676941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,64,balanced,0.03149333347876867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,64,balanced,0.033344000577926636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,64,power_law_1.01,0.03430399894714355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,64,power_law_1.01,0.03495680093765259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,64,power_law_1.2,0.03468799889087677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,64,power_law_1.2,0.034995201230049136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,8,balanced,0.031983998914559685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,8,balanced,0.03244800120592117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,8,power_law_1.01,0.06753280162811279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,8,power_law_1.01,0.06883839964866638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,8,power_law_1.2,0.06721919775009155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,1,8,power_law_1.2,0.06748160123825073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,16,1,balanced,0.02532266577084859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,16,1,balanced,0.025519999365011852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,16,1,power_law_1.01,0.023705600202083586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,16,1,power_law_1.01,0.024198399484157564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,16,1,power_law_1.2,0.023686400055885314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,16,1,power_law_1.2,0.02385919988155365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,2,1,balanced,0.03972266614437103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,2,1,balanced,0.041482667128245033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,2,1,power_law_1.01,0.04101119935512543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,2,1,power_law_1.01,0.050944000482559204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,2,1,power_law_1.2,0.04216960072517395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,2,1,power_law_1.2,0.04243200123310089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,32,1,balanced,0.02515200028816859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,32,1,balanced,0.025674665967623394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,32,1,power_law_1.01,0.02325119972229004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,32,1,power_law_1.01,0.02452480047941208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,32,1,power_law_1.2,0.02380799949169159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,32,1,power_law_1.2,0.0243136003613472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,4,1,balanced,0.031248000760873158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,4,1,balanced,0.03128000100453695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,4,1,power_law_1.01,0.028729599714279175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,4,1,power_law_1.01,0.03153280019760132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,4,1,power_law_1.2,0.029049599170684816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,4,1,power_law_1.2,0.030124801397323608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,8,1,balanced,0.02717866748571396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,8,1,balanced,0.027376001079877216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,8,1,power_law_1.01,0.024851199984550477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,8,1,power_law_1.01,0.024979199469089507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,8,1,power_law_1.2,0.025011199712753295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,3072,1536,8,256,8,1,power_law_1.2,0.02542079985141754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,1,balanced,0.14987199505170187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,1,balanced,0.1509866714477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,1,power_law_1.01,0.14057600498199463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,1,power_law_1.01,0.14394880533218385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,1,power_law_1.2,0.14049919843673705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,1,power_law_1.2,0.14784640073776245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,2,balanced,0.11617599924405415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,2,balanced,0.12139733632405598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,2,power_law_1.01,0.09905920028686524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,2,power_law_1.01,0.11556479930877686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,2,power_law_1.2,0.11349760293960572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,2,power_law_1.2,0.13186559677124024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,4,balanced,0.08683199683825175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,4,balanced,0.09089600046475728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,4,power_law_1.01,0.09455360174179077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,4,power_law_1.01,0.09782400131225585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,4,power_law_1.2,0.08955519795417785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,4,power_law_1.2,0.11219199895858764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,8,balanced,0.08713600039482117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,8,balanced,0.09516800443331401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,8,power_law_1.01,0.08536959886550903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,8,power_law_1.01,0.08606079816818238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,8,power_law_1.2,0.08573439717292786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,1,8,power_law_1.2,0.08600959777832032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,16,1,balanced,0.029301332930723827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,16,1,balanced,0.0295413335164388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,16,1,power_law_1.01,0.030988800525665283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,16,1,power_law_1.01,0.03130879998207092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,16,1,power_law_1.2,0.028140801191329955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,16,1,power_law_1.2,0.029023998975753786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,2,1,balanced,0.09437867005666097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,2,1,balanced,0.09888000289599101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,2,1,power_law_1.01,0.08372480273246766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,2,1,power_law_1.01,0.08629119992256165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,2,1,power_law_1.2,0.08097919821739197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,2,1,power_law_1.2,0.08777599930763244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,32,1,balanced,0.02770666778087616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,32,1,balanced,0.02906133234500885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,32,1,power_law_1.01,0.026470398902893065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,32,1,power_law_1.01,0.026521599292755126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,32,1,power_law_1.2,0.02632319927215576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,32,1,power_law_1.2,0.02656640112400055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,4,1,balanced,0.05823466678460439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,4,1,balanced,0.0588319996992747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,4,1,power_law_1.01,0.05127679705619812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,4,1,power_law_1.01,0.05324800014495849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,4,1,power_law_1.2,0.05170559883117676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,4,1,power_law_1.2,0.051769602298736575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,8,1,balanced,0.039850667119026184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,8,1,balanced,0.0415040006240209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,8,1,power_law_1.01,0.037190398573875426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,8,1,power_law_1.01,0.03749760091304779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,8,1,power_law_1.2,0.03749760091304779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,14336,2,8,8,1,power_law_1.2,0.04095999896526337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,1,balanced,0.07589333256085713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,1,balanced,0.07755733529726665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,1,power_law_1.01,0.07417600154876709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,1,power_law_1.01,0.0745024025440216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,1,power_law_1.2,0.07742720246315002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,1,power_law_1.2,0.08231679797172546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,128,balanced,0.031658666829268135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,128,balanced,0.03376533339420954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,128,power_law_1.01,0.03245440125465393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,128,power_law_1.01,0.03247359991073608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,128,power_law_1.2,0.03172479867935181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,128,power_law_1.2,0.031974399089813234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,16,balanced,0.03364266703526179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,16,balanced,0.033701332906881966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,16,power_law_1.01,0.0571008026599884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,16,power_law_1.01,0.057792001962661745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,16,power_law_1.2,0.052313601970672606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,16,power_law_1.2,0.05426560044288635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,2,balanced,0.058005332946777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,2,balanced,0.060906668504079185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,2,power_law_1.01,0.06586880087852479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,2,power_law_1.01,0.06928640007972717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,2,power_law_1.2,0.06425600051879883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,2,power_law_1.2,0.0706496000289917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,32,balanced,0.03347733368476232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,32,balanced,0.03365333378314972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,32,power_law_1.01,0.03863680064678192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,32,power_law_1.01,0.038950398564338684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,32,power_law_1.2,0.0392192006111145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,32,power_law_1.2,0.03935360014438629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,4,balanced,0.04185600082079569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,4,balanced,0.042261332273483276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,4,power_law_1.01,0.06629760265350342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,4,power_law_1.01,0.06951680183410644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,4,power_law_1.2,0.06047999858856201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,4,power_law_1.2,0.06250240206718445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,64,balanced,0.03327466547489166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,64,balanced,0.03342933456103007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,64,power_law_1.01,0.033548799157142636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,64,power_law_1.01,0.03375999927520752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,64,power_law_1.2,0.03320319950580597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,64,power_law_1.2,0.03369599878787995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,8,balanced,0.03376533339420954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,8,balanced,0.03558400024970373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,8,power_law_1.01,0.057734400033950806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,8,power_law_1.01,0.06321920156478882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,8,power_law_1.2,0.05596799850463867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,1,8,power_law_1.2,0.05822719931602478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,16,1,balanced,0.027232001225153606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,16,1,balanced,0.02757333219051361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,16,1,power_law_1.01,0.02659200131893158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,16,1,power_law_1.01,0.02678399980068207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,16,1,power_law_1.2,0.02651520073413849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,16,1,power_law_1.2,0.02717440128326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,2,1,balanced,0.05050666630268097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,2,1,balanced,0.05089066425959269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,2,1,power_law_1.01,0.04916479885578155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,2,1,power_law_1.01,0.049568000435829165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,2,1,power_law_1.2,0.04963839948177338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,2,1,power_law_1.2,0.05002880096435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,32,1,balanced,0.027237333357334137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,32,1,balanced,0.02752000093460083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,32,1,power_law_1.01,0.02587519884109497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,32,1,power_law_1.01,0.02661119997501373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,32,1,power_law_1.2,0.025382399559020996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,32,1,power_law_1.2,0.026035198569297792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,4,1,balanced,0.03526400029659271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,4,1,balanced,0.0355679988861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,4,1,power_law_1.01,0.035750401020050046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,4,1,power_law_1.01,0.03615359961986542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,4,1,power_law_1.2,0.036396801471710205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,4,1,power_law_1.2,0.03675520122051239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,8,1,balanced,0.02959999938805898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,8,1,balanced,0.030389333764712017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,8,1,power_law_1.01,0.030649599432945252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,8,1,power_law_1.01,0.03088639974594116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,8,1,power_law_1.2,0.030687999725341798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,1536,8,128,8,1,power_law_1.2,0.032262399792671204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,1,balanced,0.25917333364486694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,1,balanced,0.2601173321406047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,1,power_law_1.01,0.25486719608306885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,1,power_law_1.01,0.25628159046173093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,1,power_law_1.2,0.2560256004333496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,1,power_law_1.2,0.2572160005569458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,128,balanced,0.03774400055408478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,128,balanced,0.038912000755469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,128,power_law_1.01,0.057081598043441775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,128,power_law_1.01,0.05848960280418396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,128,power_law_1.2,0.057222402095794676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,128,power_law_1.2,0.05802239775657654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,16,balanced,0.05783999959627787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,16,balanced,0.05807466804981232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,16,power_law_1.01,0.20509440898895265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,16,power_law_1.01,0.20511360168457032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,16,power_law_1.2,0.1828927993774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,16,power_law_1.2,0.1839679956436157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,2,balanced,0.16102932890256247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,2,balanced,0.16221333543459573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,2,power_law_1.01,0.2617216110229492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,2,power_law_1.01,0.26236801147460936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,2,power_law_1.2,0.2302016019821167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,2,power_law_1.2,0.2412287950515747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,256,balanced,0.03762666632731756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,256,balanced,0.03798400113979975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,256,power_law_1.01,0.04161919951438904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,256,power_law_1.01,0.04216319918632507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,256,power_law_1.2,0.041388800740242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,256,power_law_1.2,0.04213759899139404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,32,balanced,0.05297600229581197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,32,balanced,0.05381333331267039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,32,power_law_1.01,0.1322111964225769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,32,power_law_1.01,0.13226879835128785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,32,power_law_1.2,0.13218560218811035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,32,power_law_1.2,0.13233280181884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,4,balanced,0.1046453317006429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,4,balanced,0.10654933253924052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,4,power_law_1.01,0.2622783899307251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,4,power_law_1.01,0.2626879930496216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,4,power_law_1.2,0.19752960205078124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,4,power_law_1.2,0.21210238933563233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,64,balanced,0.04387733340263367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,64,balanced,0.045642669002215065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,64,power_law_1.01,0.07579519748687744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,64,power_law_1.01,0.07838720083236694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,64,power_law_1.2,0.07660800218582153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,64,power_law_1.2,0.07719039916992188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,8,balanced,0.0720960001150767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,8,balanced,0.07388799885908763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,8,power_law_1.01,0.2605887889862061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,8,power_law_1.01,0.26163198947906496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,8,power_law_1.2,0.18339200019836427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,1,8,power_law_1.2,0.20483839511871338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,16,1,balanced,0.1338986655076345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,16,1,balanced,0.1357599993546804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,16,1,power_law_1.01,0.12976640462875366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,16,1,power_law_1.01,0.1315392017364502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,16,1,power_law_1.2,0.13470720052719115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,16,1,power_law_1.2,0.13544960021972657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,2,1,balanced,0.14412800470987955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,2,1,balanced,0.1441333293914795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,2,1,power_law_1.01,0.14203519821166993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,2,1,power_law_1.01,0.1420799970626831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,2,1,power_law_1.2,0.14219520092010499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,2,1,power_law_1.2,0.1431167960166931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,32,1,balanced,0.11351466178894043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,32,1,balanced,0.11512000362078349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,32,1,power_law_1.01,0.11107840538024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,32,1,power_law_1.01,0.11183359622955322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,32,1,power_law_1.2,0.11489280462265014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,32,1,power_law_1.2,0.11605119705200195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,4,1,balanced,0.09475200374921162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,4,1,balanced,0.09698133667310078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,4,1,power_law_1.01,0.09363200068473816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,4,1,power_law_1.01,0.09384959936141968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,4,1,power_law_1.2,0.09370880126953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,4,1,power_law_1.2,0.09489920139312744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,8,1,balanced,0.06345599889755249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,8,1,balanced,0.0703893353541692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,8,1,power_law_1.01,0.060134398937225345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,8,1,power_law_1.01,0.06116480231285095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,8,1,power_law_1.2,0.0607807993888855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,4096,2688,22,512,8,1,power_law_1.2,0.061536002159118655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,1,balanced,0.23767467339833578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,1,balanced,0.247381329536438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,1,power_law_1.01,0.20774400234222412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,1,power_law_1.01,0.21107840538024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,1,power_law_1.2,0.1761023998260498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,1,power_law_1.2,0.20171520709991456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,2,balanced,0.15337600310643515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,2,balanced,0.1665279964605967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,2,power_law_1.01,0.13482880592346191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,2,power_law_1.01,0.16184959411621094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,2,power_law_1.2,0.15941760540008545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,2,power_law_1.2,0.16314239501953126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,4,balanced,0.1258133351802826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,4,balanced,0.13290666540463766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,4,power_law_1.01,0.12693120241165162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,4,power_law_1.01,0.1404863953590393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,4,power_law_1.2,0.13509119749069215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,4,power_law_1.2,0.14179199934005737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,8,balanced,0.11168533563613892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,8,balanced,0.11497599879900615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,8,power_law_1.01,0.10999679565429688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,8,power_law_1.01,0.11072640419006348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,8,power_law_1.2,0.11092480421066284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,1,8,power_law_1.2,0.11131520271301269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,16,1,balanced,0.038245332737763725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,16,1,balanced,0.04160533348719279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,16,1,power_law_1.01,0.039654400944709775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,16,1,power_law_1.01,0.04058879911899567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,16,1,power_law_1.2,0.040217599272727965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,16,1,power_law_1.2,0.040268799662590025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,2,1,balanced,0.13664000233014426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,2,1,balanced,0.14415466785430908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,2,1,power_law_1.01,0.11071360111236572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,2,1,power_law_1.01,0.11855360269546508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,2,1,power_law_1.2,0.10656640529632569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,2,1,power_law_1.2,0.1310912013053894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,32,1,balanced,0.03338133295377096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,32,1,balanced,0.03536533315976461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,32,1,power_law_1.01,0.032576000690460204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,32,1,power_law_1.01,0.03281280100345611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,32,1,power_law_1.2,0.03192960023880005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,32,1,power_law_1.2,0.03260799944400787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,4,1,balanced,0.08261333405971527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,4,1,balanced,0.09430932998657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,4,1,power_law_1.01,0.07162879705429077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,4,1,power_law_1.01,0.07255679965019227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,4,1,power_law_1.2,0.07669119834899903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,4,1,power_law_1.2,0.08655359745025634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,8,1,balanced,0.061466669042905174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,8,1,balanced,0.06371733546257019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,8,1,power_law_1.01,0.051052802801132204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,8,1,power_law_1.01,0.052723199129104614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,8,1,power_law_1.2,0.051577597856521606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,16384,2,8,8,1,power_law_1.2,0.05379199981689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,1,balanced,0.13165332873662314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,1,balanced,0.14342400431632996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,1,power_law_1.01,0.13141119480133057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,1,power_law_1.01,0.131769597530365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,1,power_law_1.2,0.13184640407562256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,1,power_law_1.2,0.13308800458908082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,128,balanced,0.03734400123357773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,128,balanced,0.03756800045569738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,128,power_law_1.01,0.042771199345588685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,128,power_law_1.01,0.04292480051517487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,128,power_law_1.2,0.04318079948425293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,128,power_law_1.2,0.04334079921245575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,16,balanced,0.03770666569471359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,16,balanced,0.03791466603676478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,16,power_law_1.01,0.13610880374908446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,16,power_law_1.01,0.13713279962539673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,16,power_law_1.2,0.1336959958076477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,16,power_law_1.2,0.1362944006919861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,2,balanced,0.08589333295822144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,2,balanced,0.08852799733479817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,2,power_law_1.01,0.13684480190277098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,2,power_law_1.01,0.1391808032989502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,2,power_law_1.2,0.1341312050819397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,2,power_law_1.2,0.14008320569992067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,256,balanced,0.037621334195137024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,256,balanced,0.0377866675456365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,256,power_law_1.01,0.03619840145111084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,256,power_law_1.01,0.03696640133857727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,256,power_law_1.2,0.03688960075378418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,256,power_law_1.2,0.036959999799728395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,32,balanced,0.03765333443880081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,32,balanced,0.03766400118668874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,32,power_law_1.01,0.08068479895591736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,32,power_law_1.01,0.08376960158348083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,32,power_law_1.2,0.08307200074195861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,32,power_law_1.2,0.08312320113182067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,4,balanced,0.06392533580462138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,4,balanced,0.0703893353541692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,4,power_law_1.01,0.13674880266189576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,4,power_law_1.01,0.13904000520706178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,4,power_law_1.2,0.13696639537811278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,4,power_law_1.2,0.14060800075531005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,64,balanced,0.03772799919048945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,64,balanced,0.03781333317359289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,64,power_law_1.01,0.061913597583770755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,64,power_law_1.01,0.06335359811782837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,64,power_law_1.2,0.06228479743003845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,64,power_law_1.2,0.0630016028881073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,8,balanced,0.0454773356517156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,8,balanced,0.04593066871166229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,8,power_law_1.01,0.1359935998916626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,8,power_law_1.01,0.1361855983734131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,8,power_law_1.2,0.130950403213501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,1,8,power_law_1.2,0.13150080442428588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,16,1,balanced,0.033514666060606636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,16,1,balanced,0.03383466601371765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,16,1,power_law_1.01,0.03130879998207092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,16,1,power_law_1.01,0.03177599906921387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,16,1,power_law_1.2,0.03108479976654053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,16,1,power_law_1.2,0.03153280019760132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,2,1,balanced,0.07784533500671387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,2,1,balanced,0.07868266602357228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,2,1,power_law_1.01,0.07491840124130249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,2,1,power_law_1.01,0.07585920095443725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,2,1,power_law_1.2,0.0754047989845276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,2,1,power_law_1.2,0.07587839961051941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,32,1,balanced,0.03356266766786575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,32,1,balanced,0.033626665671666466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,32,1,power_law_1.01,0.03157120048999786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,32,1,power_law_1.01,0.03185279965400696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,32,1,power_law_1.2,0.03128319978713989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,32,1,power_law_1.2,0.031763198971748355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,4,1,balanced,0.05333866675694784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,4,1,balanced,0.05630933245023092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,4,1,power_law_1.01,0.053913599252700804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,4,1,power_law_1.01,0.0580672025680542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,4,1,power_law_1.2,0.05356799960136414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,4,1,power_law_1.2,0.053855997323989865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,8,1,balanced,0.03772266705830892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,8,1,balanced,0.0407679999868075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,8,1,power_law_1.01,0.03335680067539215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,8,1,power_law_1.01,0.034176000952720643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,8,1,power_law_1.2,0.035750401020050046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2048,8,256,8,1,power_law_1.2,0.03670400083065033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,1,balanced,0.15921066204706827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,1,balanced,0.15945067008336386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,1,power_law_1.01,0.15998719930648803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,1,power_law_1.01,0.16030720472335816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,1,power_law_1.2,0.15864959955215455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,1,power_law_1.2,0.16021759510040284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,16,balanced,0.03875733415285746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,16,balanced,0.03974399964014689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,16,power_law_1.01,0.11544320583343506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,16,power_law_1.01,0.1164031982421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,16,power_law_1.2,0.10241919755935669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,16,power_law_1.2,0.1085055947303772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,2,balanced,0.0999679962793986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,2,balanced,0.10032000144322713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,2,power_law_1.01,0.15565439462661743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,2,power_law_1.01,0.15707520246505738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,2,power_law_1.2,0.12458879947662353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,2,power_law_1.2,0.13553919792175292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,32,balanced,0.039503999054431915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,32,balanced,0.03979199876387914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,32,power_law_1.01,0.07248640060424805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,32,power_law_1.01,0.07289599776268005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,32,power_law_1.2,0.07164160013198853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,32,power_law_1.2,0.07219840288162231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,4,balanced,0.06891199946403503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,4,balanced,0.07838400204976399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,4,power_law_1.01,0.15251840353012086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,4,power_law_1.01,0.15263359546661376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,4,power_law_1.2,0.11312639713287354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,4,power_law_1.2,0.12510720491409302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,8,balanced,0.04852266609668732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,8,balanced,0.0498879998922348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,8,power_law_1.01,0.15419520139694215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,8,power_law_1.01,0.15433599948883056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,8,power_law_1.2,0.1086016058921814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,1,8,power_law_1.2,0.11984000205993653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,16,1,balanced,0.03525333354870478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,16,1,balanced,0.03570666660865148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,16,1,power_law_1.01,0.03701759874820709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,16,1,power_law_1.01,0.037676799297332766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,16,1,power_law_1.2,0.03856639862060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,16,1,power_law_1.2,0.039961600303649904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,2,1,balanced,0.0886400043964386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,2,1,balanced,0.08947733044624329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,2,1,power_law_1.01,0.08724480271339416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,2,1,power_law_1.01,0.08765439987182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,2,1,power_law_1.2,0.08698239922523499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,2,1,power_law_1.2,0.08776320219039917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,32,1,balanced,0.03309333324432373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,32,1,balanced,0.033200000723203026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,32,1,power_law_1.01,0.031865599751472476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,32,1,power_law_1.01,0.031948798894882204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,32,1,power_law_1.2,0.03258239924907684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,32,1,power_law_1.2,0.034720000624656674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,4,1,balanced,0.06187200049559275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,4,1,balanced,0.06202666461467743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,4,1,power_law_1.01,0.0597760021686554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,4,1,power_law_1.01,0.06295679807662964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,4,1,power_law_1.2,0.05942400097846985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,4,1,power_law_1.2,0.05980160236358643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,8,1,balanced,0.04590400060017904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,8,1,balanced,0.04753066599369049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,8,1,power_law_1.01,0.045126399397850035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,8,1,power_law_1.01,0.04572800099849701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,8,1,power_law_1.2,0.045817598700523376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,6144,2560,8,160,8,1,power_law_1.2,0.04613119959831238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,1,balanced,0.14250133434931436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,1,balanced,0.14627733826637268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,1,power_law_1.01,0.14113919734954833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,1,power_law_1.01,0.1422271966934204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,1,power_law_1.2,0.1424512028694153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,1,power_law_1.2,0.14263039827346802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,128,balanced,0.03978666663169861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,128,balanced,0.041696002086003624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,128,power_law_1.01,0.04684160053730011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,128,power_law_1.01,0.04835839867591858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,128,power_law_1.2,0.04636160135269165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,128,power_law_1.2,0.049292799830436704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,16,balanced,0.04064533362785975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,16,balanced,0.04161066561937332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,16,power_law_1.01,0.14817919731140136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,16,power_law_1.01,0.15041919946670532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,16,power_law_1.2,0.14659839868545532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,16,power_law_1.2,0.14692480564117433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,2,balanced,0.09286399682362874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,2,balanced,0.09455999732017517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,2,power_law_1.01,0.14833279848098754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,2,power_law_1.01,0.14911999702453613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,2,power_law_1.2,0.14842239618301392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,2,power_law_1.2,0.1573184013366699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,256,balanced,0.03995733211437861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,256,balanced,0.041690667470296226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,256,power_law_1.01,0.0395904004573822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,256,power_law_1.01,0.040294399857521056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,256,power_law_1.2,0.03941119909286499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,256,power_law_1.2,0.039750400185585025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,32,balanced,0.041434665520985924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,32,balanced,0.041573333243529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,32,power_law_1.01,0.09174399971961975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,32,power_law_1.01,0.092467200756073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,32,power_law_1.2,0.09048960208892823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,32,power_law_1.2,0.0913536012172699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,4,balanced,0.0776693324247996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,4,balanced,0.091648002465566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,4,power_law_1.01,0.14859520196914672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,4,power_law_1.01,0.15096319913864137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,4,power_law_1.2,0.14364800453186036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,4,power_law_1.2,0.14467840194702147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,64,balanced,0.040896000961462654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,64,balanced,0.04148799926042557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,64,power_law_1.01,0.06661760210990905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,64,power_law_1.01,0.0670527994632721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,64,power_law_1.2,0.06600959897041321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,64,power_law_1.2,0.06711680293083191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,8,balanced,0.05213333169619242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,8,balanced,0.06214400132497152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,8,power_law_1.01,0.14839040040969848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,8,power_law_1.01,0.15433599948883056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,8,power_law_1.2,0.14905600547790526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,1,8,power_law_1.2,0.15021439790725707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,16,1,balanced,0.035599999129772186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,16,1,balanced,0.03571200122435888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,16,1,power_law_1.01,0.033983999490737916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,16,1,power_law_1.01,0.03456639945507049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,16,1,power_law_1.2,0.034016001224517825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,16,1,power_law_1.2,0.034246399998664856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,2,1,balanced,0.08334933718045552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,2,1,balanced,0.0848640004793803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,2,1,power_law_1.01,0.08149759769439698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,2,1,power_law_1.01,0.08217599987983704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,2,1,power_law_1.2,0.08257279992103576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,2,1,power_law_1.2,0.08266239762306213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,32,1,balanced,0.03534399966398875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,32,1,balanced,0.03555200000603994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,32,1,power_law_1.01,0.033555200695991515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,32,1,power_law_1.01,0.03363839983940124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,32,1,power_law_1.2,0.03315199911594391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,32,1,power_law_1.2,0.03342719972133636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,4,1,balanced,0.0599839985370636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,4,1,balanced,0.06016000111897787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,4,1,power_law_1.01,0.06017919778823853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,4,1,power_law_1.01,0.0627135992050171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,4,1,power_law_1.2,0.058483201265335086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,4,1,power_law_1.2,0.060499197244644164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,8,1,balanced,0.04608533283074697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,8,1,balanced,0.047882666190465294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,8,1,power_law_1.01,0.0392767995595932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,8,1,power_law_1.01,0.04147840142250061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,8,1,power_law_1.2,0.03978239893913269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,256,8,1,power_law_1.2,0.04015359878540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,1,balanced,0.14282666643460593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,1,balanced,0.1460533340771993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,1,power_law_1.01,0.14172159433364867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,1,power_law_1.01,0.14361599683761597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,1,power_law_1.2,0.14090240001678467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,1,power_law_1.2,0.14218239784240722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,128,balanced,0.041696002086003624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,128,balanced,0.041722665230433144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,128,power_law_1.01,0.057817602157592775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,128,power_law_1.01,0.05834239721298218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,128,power_law_1.2,0.058143997192382814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,128,power_law_1.2,0.05975679755210876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,16,balanced,0.04025600105524063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,16,balanced,0.04181333382924398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,16,power_law_1.01,0.14818559885025023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,16,power_law_1.01,0.14995839595794677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,16,power_law_1.2,0.14823039770126342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,16,power_law_1.2,0.15223679542541504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,2,balanced,0.09422399600346883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,2,balanced,0.09488532940546672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,2,power_law_1.01,0.14883840084075928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,2,power_law_1.01,0.15018880367279053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,2,power_law_1.2,0.1502784013748169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,2,power_law_1.2,0.1506943941116333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,32,balanced,0.04154666761557261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,32,balanced,0.04179200033346812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,32,power_law_1.01,0.12617599964141846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,32,power_law_1.01,0.12647680044174195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,32,power_law_1.2,0.12655359506607056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,32,power_law_1.2,0.12673920392990112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,4,balanced,0.06850133339564006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,4,balanced,0.07042133311430614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,4,power_law_1.01,0.14970879554748534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,4,power_law_1.01,0.15160319805145264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,4,power_law_1.2,0.14944640398025513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,4,power_law_1.2,0.15140479803085327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,64,balanced,0.04170133173465729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,64,balanced,0.04180799921353658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,64,power_law_1.01,0.07783679962158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,64,power_law_1.01,0.08009600043296813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,64,power_law_1.2,0.07774720191955567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,64,power_law_1.2,0.08023679852485657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,8,balanced,0.0496319979429245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,8,balanced,0.049925332268079124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,8,power_law_1.01,0.14866559505462645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,8,power_law_1.01,0.14999680519104003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,8,power_law_1.2,0.14892159700393676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,1,8,power_law_1.2,0.15175679922103882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,16,1,balanced,0.03530666728814443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,16,1,balanced,0.03533866753180822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,16,1,power_law_1.01,0.03370240032672882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,16,1,power_law_1.01,0.03381119966506958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,16,1,power_law_1.2,0.03338240087032318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,16,1,power_law_1.2,0.03400320112705231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,2,1,balanced,0.08403199911117554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,2,1,balanced,0.08508267005284627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,2,1,power_law_1.01,0.08671360015869141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,2,1,power_law_1.01,0.09472640156745911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,2,1,power_law_1.2,0.08183040022850037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,2,1,power_law_1.2,0.08194559812545776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,32,1,balanced,0.03544000039498011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,32,1,balanced,0.035530666510264076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,32,1,power_law_1.01,0.033529600501060484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,32,1,power_law_1.01,0.03391999900341034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,32,1,power_law_1.2,0.033542400598526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,32,1,power_law_1.2,0.03403519988059998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,4,1,balanced,0.058261334896087646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,4,1,balanced,0.05985066791375478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,4,1,power_law_1.01,0.05813760161399841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,4,1,power_law_1.01,0.06513919830322265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,4,1,power_law_1.2,0.05768960118293762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,4,1,power_law_1.2,0.05816320180892944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,8,1,balanced,0.04348266621430715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,8,1,balanced,0.04377600053946177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,8,1,power_law_1.01,0.04110719859600067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,8,1,power_law_1.01,0.04142079949378967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,8,1,power_law_1.2,0.03993600010871887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2,7168,2048,8,384,8,1,power_law_1.2,0.04175359904766083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,1,balanced,0.26498667399088544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,1,balanced,0.26549333333969116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,1,power_law_1.01,0.31710081100463866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,1,power_law_1.01,0.32062079906463625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,1,power_law_1.2,0.32636799812316897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,1,power_law_1.2,0.3270911931991577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,128,balanced,0.14611732959747314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,128,balanced,0.14642666776974997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,128,power_law_1.01,0.1497215986251831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,128,power_law_1.01,0.15224319696426392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,128,power_law_1.2,0.15324800014495848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,128,power_law_1.2,0.1535104036331177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,16,balanced,0.15262933572133383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,16,balanced,0.1529706617196401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,16,power_law_1.01,0.1656448006629944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,16,power_law_1.01,0.1667904019355774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,16,power_law_1.2,0.1678272008895874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,16,power_law_1.2,0.17161600589752196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,2,balanced,0.218341330687205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,2,balanced,0.21921600898106894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,2,power_law_1.01,0.25304958820343015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,2,power_law_1.01,0.25319681167602537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,2,power_law_1.2,0.2573568105697632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,2,power_law_1.2,0.2587455987930298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,32,balanced,0.14830933014551798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,32,balanced,0.1492693324883779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,32,power_law_1.01,0.15532159805297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,32,power_law_1.01,0.1562880039215088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,32,power_law_1.2,0.16168320178985596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,32,power_law_1.2,0.1619647979736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,4,balanced,0.1851039926211039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,4,balanced,0.18625066677729288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,4,power_law_1.01,0.2050879955291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,4,power_law_1.01,0.2075711965560913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,4,power_law_1.2,0.2121216058731079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,4,power_law_1.2,0.21219840049743652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,64,balanced,0.14752533038457236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,64,balanced,0.1479146679242452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,64,power_law_1.01,0.15119359493255616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,64,power_law_1.01,0.15167360305786132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,64,power_law_1.2,0.15507199764251708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,64,power_law_1.2,0.15751680135726928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,8,balanced,0.1646719972292582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,8,balanced,0.164682666460673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,8,power_law_1.01,0.18001279830932618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,8,power_law_1.01,0.18071039915084838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,8,power_law_1.2,0.18260480165481568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,1,8,power_law_1.2,0.18440959453582764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,2,1,balanced,0.19013333320617676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,2,1,balanced,0.19167999426523843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,2,1,power_law_1.01,0.22539520263671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,2,1,power_law_1.01,0.22613120079040527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,2,1,power_law_1.2,0.22860159873962402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,2,1,power_law_1.2,0.23129599094390868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,4,1,balanced,0.15959466497103372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,4,1,balanced,0.1630453368028005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,4,1,power_law_1.01,0.1869312047958374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,4,1,power_law_1.01,0.18765439987182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,4,1,power_law_1.2,0.19084800481796266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2048,768,8,128,4,1,power_law_1.2,0.1912384033203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,1,balanced,0.5396480162938436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,1,balanced,0.5447573264439901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,1,power_law_1.01,0.6291327953338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,1,power_law_1.01,0.6310976028442383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,1,power_law_1.2,0.6446335792541504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,1,power_law_1.2,0.6521728038787842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,128,balanced,0.18884267409642538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,128,balanced,0.1893813411394755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,128,power_law_1.01,0.19498879909515382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,128,power_law_1.01,0.19827840328216553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,128,power_law_1.2,0.20760319232940674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,128,power_law_1.2,0.20896000862121583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,16,balanced,0.21583465735117593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,16,balanced,0.21633066733678183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,16,power_law_1.01,0.2307647943496704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,16,power_law_1.01,0.23469440937042235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,16,power_law_1.2,0.24375040531158448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,16,power_law_1.2,0.24681599140167237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,2,balanced,0.3853600025177002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,2,balanced,0.3853973150253296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,2,power_law_1.01,0.43636479377746584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,2,power_law_1.01,0.44748802185058595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,2,power_law_1.2,0.44725761413574217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,2,power_law_1.2,0.4555200099945068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,32,balanced,0.19686400890350342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,32,balanced,0.19798932472864786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,32,power_law_1.01,0.21349759101867677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,32,power_law_1.01,0.21546239852905275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,32,power_law_1.2,0.21867520809173585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,32,power_law_1.2,0.2233664035797119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,4,balanced,0.29364800453186035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,4,balanced,0.2964106599489848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,4,power_law_1.01,0.32702720165252686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,4,power_law_1.01,0.32936959266662597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,4,power_law_1.2,0.33489279747009276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,4,power_law_1.2,0.34235520362854005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,64,balanced,0.1919999917348226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,64,balanced,0.19288533926010132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,64,power_law_1.01,0.203603196144104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,64,power_law_1.01,0.20848639011383058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,64,power_law_1.2,0.2099839925765991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,64,power_law_1.2,0.21016960144042968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,8,balanced,0.24454933404922485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,8,power_law_1.01,0.26963200569152834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,8,power_law_1.01,0.2730815887451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,8,power_law_1.2,0.27203199863433836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,1,8,power_law_1.2,0.2783168077468872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,16,1,balanced,0.8260533014933268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,16,1,balanced,0.8276267051696777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,16,1,power_law_1.01,1.1306303977966308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,16,1,power_law_1.01,1.1315135955810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,16,1,power_law_1.2,1.1703359603881835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,16,1,power_law_1.2,1.1772671699523927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,2,1,balanced,0.34139732519785565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,2,1,balanced,0.341536005338033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,2,1,power_law_1.01,0.39777920246124265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,2,1,power_law_1.01,0.3981568098068237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,2,1,power_law_1.2,0.4035647869110107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,2,1,power_law_1.2,0.4105855941772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,32,1,balanced,0.7153226534525553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,32,1,balanced,0.716602643330892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,32,1,power_law_1.01,0.9922687530517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,32,1,power_law_1.01,1.0005951881408692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,32,1,power_law_1.2,1.002943992614746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,32,1,power_law_1.2,1.0221568107604981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,4,1,balanced,0.2409013311068217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,4,1,balanced,0.24388800064722696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,4,1,power_law_1.01,0.272652792930603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,4,1,power_law_1.01,0.27774078845977784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,4,1,power_law_1.2,0.28587520122528076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,4,1,power_law_1.2,0.2867072105407715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,8,1,balanced,1.1284586588541667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,8,1,balanced,1.1656373341878254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,8,1,power_law_1.01,1.5006208419799805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,8,1,power_law_1.01,1.5337920188903809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,8,1,power_law_1.2,1.591001605987549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,2688,1856,6,128,8,1,power_law_1.2,1.596127986907959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,1,balanced,0.8827679951985677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,1,balanced,0.8991946379343668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,1,power_law_1.01,0.9459136009216309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,1,power_law_1.01,0.9591872215270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,1,power_law_1.2,0.9862336158752442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,1,power_law_1.2,1.0019647598266601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,128,balanced,0.248906672000885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,128,balanced,0.25064533948898315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,128,power_law_1.01,0.256710410118103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,128,power_law_1.01,0.2568511962890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,128,power_law_1.2,0.26051840782165525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,128,power_law_1.2,0.2628544092178345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,16,balanced,0.2904319961865743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,16,balanced,0.2913600007692973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,16,power_law_1.01,0.3095616102218628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,16,power_law_1.01,0.310534405708313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,16,power_law_1.2,0.31201279163360596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,16,power_law_1.2,0.31315200328826903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,2,balanced,0.585973342259725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,2,balanced,0.586026668548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,2,power_law_1.01,0.6253312110900879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,2,power_law_1.01,0.6274496078491211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,2,power_law_1.2,0.6292223930358887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,2,power_law_1.2,0.6588096141815185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,256,balanced,0.24659200509389242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,256,balanced,0.24665600061416626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,256,power_law_1.01,0.2518656015396118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,256,power_law_1.01,0.2522304058074951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,256,power_law_1.2,0.25598080158233644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,256,power_law_1.2,0.25657598972320556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,32,balanced,0.2651253342628479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,32,balanced,0.2651626666386922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,32,power_law_1.01,0.27857921123504636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,32,power_law_1.01,0.2789504051208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,32,power_law_1.2,0.2848128080368042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,32,power_law_1.2,0.28577280044555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,4,balanced,0.42238398392995197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,4,balanced,0.42441598574320477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,4,power_law_1.01,0.44890241622924804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,4,power_law_1.01,0.4512639999389648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,4,power_law_1.2,0.45470080375671384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,4,power_law_1.2,0.4573376178741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,64,balanced,0.2529226740201314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,64,balanced,0.25356266895929974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,64,power_law_1.01,0.2645440101623535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,64,power_law_1.01,0.2646591901779175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,64,power_law_1.2,0.2667455911636353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,64,power_law_1.2,0.2696768045425415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,8,balanced,0.333957314491272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,8,balanced,0.33607999483744305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,8,power_law_1.01,0.3540287971496582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,8,power_law_1.01,0.3546560049057007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,8,power_law_1.2,0.36373119354248046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,1,8,power_law_1.2,0.36561279296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,16,1,balanced,0.24885332584381104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,16,1,balanced,0.2491146723429362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,16,1,power_law_1.01,0.27555840015411376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,16,1,power_law_1.01,0.2790208101272583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,16,1,power_law_1.2,0.28132479190826415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,16,1,power_law_1.2,0.2823807954788208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,2,1,balanced,0.5361866553624471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,2,1,balanced,0.5369760195414225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,2,1,power_law_1.01,0.5750271797180175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,2,1,power_law_1.01,0.576204776763916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,2,1,power_law_1.2,0.597049617767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,2,1,power_law_1.2,0.6022848129272461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,32,1,balanced,0.2280799945195516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,32,1,balanced,0.22817067305246988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,32,1,power_law_1.01,0.25585920810699464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,32,1,power_law_1.01,0.2574847936630249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,32,1,power_law_1.2,0.260153603553772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,32,1,power_law_1.2,0.2610752105712891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,4,1,balanced,0.36773331960042316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,4,1,balanced,0.3684106667836507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,4,1,power_law_1.01,0.3967616081237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,4,1,power_law_1.01,0.3972480058670044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,4,1,power_law_1.2,0.404966402053833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,4,1,power_law_1.2,0.406060791015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,8,1,balanced,0.29128533601760864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,8,1,balanced,0.291375994682312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,8,1,power_law_1.01,0.31658880710601806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,8,1,power_law_1.01,0.3172096014022827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,8,1,power_law_1.2,0.3245055913925171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,3072,1536,8,256,8,1,power_law_1.2,0.32639360427856445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,1,balanced,0.9882826805114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,1,balanced,0.9936052958170573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,1,power_law_1.01,1.0441791534423828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,1,power_law_1.01,1.0828927993774413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,1,power_law_1.2,1.065120029449463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,1,power_law_1.2,1.0872447967529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,2,balanced,0.6353333393732706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,2,balanced,0.6362719933191935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,2,power_law_1.01,0.7695104122161865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,2,power_law_1.01,0.8215167999267579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,2,power_law_1.2,0.7974592208862304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,2,power_law_1.2,0.8389056205749512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,4,balanced,0.45209066073099774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,4,balanced,0.45582401752471924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,4,power_law_1.01,0.6471680164337158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,4,power_law_1.01,0.6533440113067627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,4,power_law_1.2,0.6405375957489013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,4,power_law_1.2,0.6625279903411865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,8,balanced,0.39193065961201984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,8,balanced,0.3925120035807292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,8,power_law_1.01,0.5832831859588623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,8,power_law_1.01,0.5877632141113281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,8,power_law_1.2,0.6021247863769531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,1,8,power_law_1.2,0.6107071876525879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,16,1,balanced,0.13041067123413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,16,1,balanced,0.1328213314215342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,16,1,power_law_1.01,0.13601280450820924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,16,1,power_law_1.01,0.13674880266189576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,16,1,power_law_1.2,0.13562239408493043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,16,1,power_law_1.2,0.13646080493927001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,2,1,balanced,0.5240426858266195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,2,1,balanced,0.5278400182723999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,2,1,power_law_1.01,0.5628416061401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,2,1,power_law_1.01,0.5642816066741944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,2,1,power_law_1.2,0.5520127773284912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,2,1,power_law_1.2,0.5590591907501221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,32,1,balanced,0.10114666819572449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,32,1,balanced,0.10172800223032634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,32,1,power_law_1.01,0.10406399965286255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,32,1,power_law_1.01,0.10498559474945068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,32,1,power_law_1.2,0.10496640205383301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,32,1,power_law_1.2,0.10566400289535523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,4,1,balanced,0.2961919903755188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,4,1,balanced,0.3020266691843669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,4,1,power_law_1.01,0.3169600009918213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,4,1,power_law_1.01,0.319488000869751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,4,1,power_law_1.2,0.3076672077178955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,4,1,power_law_1.2,0.31434240341186526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,8,1,balanced,0.1880693236986796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,8,1,balanced,0.19035732746124268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,8,1,power_law_1.01,0.19536639451980592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,8,1,power_law_1.01,0.19649280309677125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,8,1,power_law_1.2,0.19704960584640502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,14336,2,8,8,1,power_law_1.2,0.19790079593658447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,1,balanced,0.6739306449890137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,1,balanced,0.6799893379211426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,1,power_law_1.01,0.8448575973510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,1,power_law_1.01,0.8523520469665528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,1,power_law_1.2,0.8658495903015136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,1,power_law_1.2,0.867193603515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,128,balanced,0.2466826637585958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,128,balanced,0.24754667282104492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,128,power_law_1.01,0.26238079071044923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,128,power_law_1.01,0.2659584045410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,128,power_law_1.2,0.27292799949645996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,128,power_law_1.2,0.27345919609069824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,16,balanced,0.26943467060724896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,16,balanced,0.27129065990448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,16,power_law_1.01,0.30135679244995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,16,power_law_1.01,0.3052160024642944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,16,power_law_1.2,0.3133375883102417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,16,power_law_1.2,0.31646080017089845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,2,balanced,0.483295996983846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,2,balanced,0.48571733633677167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,2,power_law_1.01,0.5773888111114502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,2,power_law_1.01,0.5804416179656983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,2,power_law_1.2,0.5943295955657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,2,power_law_1.2,0.6050303936004638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,32,balanced,0.2552586595217387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,32,balanced,0.25550933678944904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,32,power_law_1.01,0.2778624057769775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,32,power_law_1.01,0.28194561004638674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,32,power_law_1.2,0.29202558994293215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,32,power_law_1.2,0.29847040176391604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,4,balanced,0.3622399965922038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,4,balanced,0.36432000001271564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,4,power_law_1.01,0.4246335983276367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,4,power_law_1.01,0.43167362213134763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,4,power_law_1.2,0.44463357925415037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,4,power_law_1.2,0.45819520950317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,64,balanced,0.24804266293843588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,64,balanced,0.24829866488774618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,64,power_law_1.01,0.26915199756622316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,64,power_law_1.01,0.27479679584503175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,64,power_law_1.2,0.2773695945739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,64,power_law_1.2,0.278387188911438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,8,balanced,0.2997173269589742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,8,balanced,0.30189865827560425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,8,power_law_1.01,0.3468480110168457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,8,power_law_1.01,0.34883201122283936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,8,power_law_1.2,0.3608000040054321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,1,8,power_law_1.2,0.36579198837280275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,16,1,balanced,0.22526933749516806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,16,1,balanced,0.22557334105173746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,16,1,power_law_1.01,0.26832640171051025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,16,1,power_law_1.01,0.26855039596557617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,16,1,power_law_1.2,0.2714240074157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,16,1,power_law_1.2,0.2735039949417114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,2,1,balanced,0.4351786772410075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,2,1,balanced,0.4355413516362508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,2,1,power_law_1.01,0.5279551982879639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,2,1,power_law_1.01,0.5297279834747315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,2,1,power_law_1.2,0.5406400203704834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,2,1,power_law_1.2,0.5427648067474365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,32,1,balanced,0.2153279980023702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,32,1,balanced,0.21612799167633057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,32,1,power_law_1.01,0.24609920978546143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,32,1,power_law_1.01,0.2477952003479004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,32,1,power_law_1.2,0.24972159862518312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,32,1,power_law_1.2,0.25027201175689695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,4,1,balanced,0.3088853359222412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,4,1,balanced,0.30958400170008343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,4,1,power_law_1.01,0.3697216033935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,4,1,power_law_1.01,0.37389440536499025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,4,1,power_law_1.2,0.37715198993682864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,4,1,power_law_1.2,0.37882239818573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,8,1,balanced,0.26180267333984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,8,1,balanced,0.26258132855097455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,8,1,power_law_1.01,0.30760319232940675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,8,1,power_law_1.01,0.3084671974182129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,8,1,power_law_1.2,0.31240320205688477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,1536,8,128,8,1,power_law_1.2,0.3136255979537964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,1,balanced,4.014128049214681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,1,balanced,4.054138819376628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,1,power_law_1.01,4.729983901977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,1,power_law_1.01,4.739372634887696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,1,power_law_1.2,4.873881530761719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,1,power_law_1.2,4.957696151733399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,128,balanced,0.8796160221099854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,128,balanced,0.881493330001831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,128,power_law_1.01,0.9110272407531739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,128,power_law_1.01,0.9117440223693848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,128,power_law_1.2,0.9227968215942383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,128,power_law_1.2,0.9268159866333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,16,balanced,1.055509328842163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,16,balanced,1.0590720176696777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,16,power_law_1.01,1.134995174407959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,16,power_law_1.01,1.1369088172912598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,16,power_law_1.2,1.1638591766357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,16,power_law_1.2,1.1771967887878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,2,balanced,2.4144959449768066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,2,balanced,2.4610400199890137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,2,power_law_1.01,2.774412727355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,2,power_law_1.01,2.7942975997924804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,2,power_law_1.2,2.857062339782715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,2,power_law_1.2,2.9165695190429686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,256,balanced,0.8702560265858968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,256,balanced,0.871941328048706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,256,power_law_1.01,0.8934144020080567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,256,power_law_1.01,0.8975744247436523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,256,power_law_1.2,0.9031295776367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,256,power_law_1.2,0.9117055892944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,32,balanced,0.9552799860636393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,32,balanced,0.9607679843902588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,32,power_law_1.01,1.0155455589294433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,32,power_law_1.01,1.0295167922973634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,32,power_law_1.2,1.0406335830688476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,32,power_law_1.2,1.050489616394043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,4,balanced,1.6195893287658691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,4,balanced,1.6266345977783203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,4,power_law_1.01,1.8301120758056642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,4,power_law_1.01,1.841164779663086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,4,power_law_1.2,1.8933120727539063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,4,power_law_1.2,1.9142080307006837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,64,balanced,0.9067626794179281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,64,balanced,0.9080266952514648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,64,power_law_1.01,0.9454591751098633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,64,power_law_1.01,0.9511360168457031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,64,power_law_1.2,0.9689087867736816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,64,power_law_1.2,0.9756095886230469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,8,balanced,1.2518293062845867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,8,balanced,1.2576853434244792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,8,power_law_1.01,1.3794879913330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,8,power_law_1.01,1.3802111625671387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,8,power_law_1.2,1.4081536293029786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,1,8,power_law_1.2,1.4159423828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,16,1,balanced,6.000570933024089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,16,1,balanced,6.385221481323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,16,1,power_law_1.01,8.242150115966798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,16,1,power_law_1.01,8.300434875488282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,16,1,power_law_1.2,8.61254425048828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,16,1,power_law_1.2,8.741004943847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,2,1,balanced,2.226933320363363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,2,1,balanced,2.2441226641337075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,2,1,power_law_1.01,2.519046401977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,2,1,power_law_1.01,2.5376895904541015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,2,1,power_law_1.2,2.6226816177368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,2,1,power_law_1.2,2.6443456649780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,32,1,balanced,4.173263867696126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,32,1,balanced,4.2538401285807295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,32,1,power_law_1.01,5.712422561645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,32,1,power_law_1.01,5.748160171508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,32,1,power_law_1.2,5.938515090942383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,32,1,power_law_1.2,5.9467521667480465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,4,1,balanced,1.3517173131306965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,4,1,balanced,1.3628692626953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,4,1,power_law_1.01,1.5715007781982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,4,1,power_law_1.01,1.574240016937256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,4,1,power_law_1.2,1.6215551376342774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,4,1,power_law_1.2,1.627302360534668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,8,1,balanced,0.9434560139973959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,8,1,balanced,0.9438772996266683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,8,1,power_law_1.01,1.0924032211303711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,8,1,power_law_1.01,1.096076774597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,8,1,power_law_1.2,1.1178879737854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,4096,2688,22,512,8,1,power_law_1.2,1.121395206451416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,1,balanced,1.5646826426188152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,1,balanced,1.571381409962972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,1,power_law_1.01,1.6771711349487304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,1,power_law_1.01,1.7139455795288085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,1,power_law_1.2,1.672127914428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,1,power_law_1.2,1.6856128692626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,2,balanced,0.9307680130004883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,2,balanced,0.9499466419219971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,2,power_law_1.01,1.2272192001342774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,2,power_law_1.01,1.2800576210021972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,2,power_law_1.2,1.199065589904785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,2,power_law_1.2,1.3180352210998536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,4,balanced,0.6335893472035726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,4,balanced,0.6423946619033813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,4,power_law_1.01,0.8762751579284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,4,power_law_1.01,0.9556927680969238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,4,power_law_1.2,0.9566207885742187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,4,power_law_1.2,1.034278392791748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,8,balanced,0.4782400131225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,8,balanced,0.4817546606063843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,8,power_law_1.01,0.7629951953887939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,8,power_law_1.01,0.7908800125122071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,8,power_law_1.2,0.8245247840881348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,1,8,power_law_1.2,0.8699328422546386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,16,1,balanced,0.18399999539057413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,16,1,balanced,0.1843573252360026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,16,1,power_law_1.01,0.18958719968795776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,16,1,power_law_1.01,0.19209599494934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,16,1,power_law_1.2,0.18826240301132202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,16,1,power_law_1.2,0.19779200553894044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,2,1,balanced,0.7945066293080648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,2,1,balanced,0.8046613534291586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,2,1,power_law_1.01,0.8843839645385743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,2,1,power_law_1.01,0.889958381652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,2,1,power_law_1.2,0.8887935638427734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,2,1,power_law_1.2,0.907084846496582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,32,1,balanced,0.13392000397046408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,32,1,balanced,0.13434666395187378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,32,1,power_law_1.01,0.14401919841766359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,32,1,power_law_1.01,0.1445312023162842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,32,1,power_law_1.2,0.13928960561752318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,32,1,power_law_1.2,0.14421119689941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,4,1,balanced,0.43611733118693036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,4,1,balanced,0.44232531388600665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,4,1,power_law_1.01,0.4728831768035889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,4,1,power_law_1.01,0.482528018951416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,4,1,power_law_1.2,0.4745664119720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,4,1,power_law_1.2,0.48944640159606934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,8,1,balanced,0.27187200387318927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,8,1,balanced,0.27719465891520184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,8,1,power_law_1.01,0.27996799945831297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,8,1,power_law_1.01,0.28787200450897216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,8,1,power_law_1.2,0.28229119777679446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,16384,2,8,8,1,power_law_1.2,0.2853440046310425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,1,balanced,2.0506879488627114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,1,balanced,2.15557861328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,1,power_law_1.01,2.2551103591918946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,1,power_law_1.01,2.268838310241699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,1,power_law_1.2,2.3373952865600587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,1,power_law_1.2,2.3592832565307615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,128,balanced,0.3909173409144084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,128,balanced,0.3924266497294108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,128,power_law_1.01,0.41069440841674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,128,power_law_1.01,0.41240320205688474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,128,power_law_1.2,0.418233585357666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,128,power_law_1.2,0.4279359817504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,16,balanced,0.49113066991170246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,16,balanced,0.49352534612019855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,16,power_law_1.01,0.5246592044830323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,16,power_law_1.01,0.5393856048583985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,16,power_law_1.2,0.5469567775726318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,16,power_law_1.2,0.5546751976013183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,2,balanced,1.25654403368632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,2,balanced,1.257525364557902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,2,power_law_1.01,1.360588836669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,2,power_law_1.01,1.3691264152526856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,2,power_law_1.2,1.3887359619140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,2,power_law_1.2,1.4320063591003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,256,balanced,0.38581868012746173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,256,balanced,0.38714667161305744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,256,power_law_1.01,0.398144006729126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,256,power_law_1.01,0.3994623899459839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,256,power_law_1.2,0.4119552135467529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,256,power_law_1.2,0.4141119956970215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,32,balanced,0.43182400862375897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,32,balanced,0.43375468254089355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,32,power_law_1.01,0.4571199893951416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,32,power_law_1.01,0.46190719604492186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,32,power_law_1.2,0.4742464065551758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,32,power_law_1.2,0.47713279724121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,4,balanced,0.8235200246175131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,4,balanced,0.8262026309967041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,4,power_law_1.01,0.8916223526000977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,4,power_law_1.01,0.907750415802002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,4,power_law_1.2,0.9183808326721191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,4,power_law_1.2,0.9295488357543945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,64,balanced,0.40132800738016766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,64,balanced,0.40300265947977704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,64,power_law_1.01,0.4289408206939697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,64,power_law_1.01,0.4316544055938721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,64,power_law_1.2,0.4405375957489014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,64,power_law_1.2,0.4538303852081299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,8,balanced,0.6013226509094238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,8,balanced,0.6034613450368246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,8,power_law_1.01,0.6459263801574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,8,power_law_1.01,0.6574912071228027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,8,power_law_1.2,0.6737152099609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,1,8,power_law_1.2,0.6786367893218994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,16,1,balanced,0.44190935293833417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,16,1,balanced,0.44227198759714764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,16,1,power_law_1.01,0.48762240409851076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,16,1,power_law_1.01,0.49066882133483886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,16,1,power_law_1.2,0.5028096199035644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,16,1,power_law_1.2,0.506604814529419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,2,1,balanced,1.1687733332316081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,2,1,balanced,1.1699466705322266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,2,1,power_law_1.01,1.2766655921936034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,2,1,power_law_1.01,1.2913599967956544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,2,1,power_law_1.2,1.3319040298461915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,2,1,power_law_1.2,1.3323776245117187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,32,1,balanced,0.39800000190734863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,32,1,balanced,0.3983786503473918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,32,1,power_law_1.01,0.44968318939208984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,32,1,power_law_1.01,0.4499519824981689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,32,1,power_law_1.2,0.45919361114501955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,32,1,power_law_1.2,0.45934720039367677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,4,1,balanced,0.741866668065389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,4,1,balanced,0.7434666951497396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,4,1,power_law_1.01,0.8145855903625489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,4,1,power_law_1.01,0.8163007736206055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,4,1,power_law_1.2,0.8445119857788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,4,1,power_law_1.2,0.8475711822509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,8,1,balanced,0.5493919849395752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,8,1,balanced,0.5498453378677368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,8,1,power_law_1.01,0.598035192489624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,8,1,power_law_1.01,0.5980544090270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,8,1,power_law_1.2,0.6116479873657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2048,8,256,8,1,power_law_1.2,0.6122879981994629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,1,balanced,1.7385600407918294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,1,balanced,1.7710347175598145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,1,power_law_1.01,2.100268745422363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,1,power_law_1.01,2.11144962310791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,1,power_law_1.2,2.2136831283569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,1,power_law_1.2,2.2367103576660154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,16,balanced,0.4557013511657715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,16,balanced,0.4559573332468669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,16,power_law_1.01,0.5232831954956054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,16,power_law_1.01,0.5238272190093994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,16,power_law_1.2,0.5493696212768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,16,power_law_1.2,0.5676544189453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,2,balanced,1.0640106995900471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,2,balanced,1.0654773712158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,2,power_law_1.01,1.2801983833312989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,2,power_law_1.01,1.300057601928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,2,power_law_1.2,1.3153727531433106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,2,power_law_1.2,1.333952045440674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,32,balanced,0.4094293514887492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,32,balanced,0.4103413422902425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,32,power_law_1.01,0.45571198463439944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,32,power_law_1.01,0.4666816234588623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,32,power_law_1.2,0.4759552001953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,32,power_law_1.2,0.49992961883544923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,4,balanced,0.7185813585917155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,4,balanced,0.7206453482309977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,4,power_law_1.01,0.8530624389648438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,4,power_law_1.01,0.8670783996582031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,4,power_law_1.2,0.8771648406982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,4,power_law_1.2,0.9014080047607422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,8,balanced,0.5468693176905314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,8,balanced,0.5478773514429728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,8,power_law_1.01,0.6471807956695557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,8,power_law_1.01,0.6478591918945312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,8,power_law_1.2,0.6597311973571778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,1,8,power_law_1.2,0.6802879810333252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,16,1,balanced,0.3842879931131999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,16,1,balanced,0.38482666015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,16,1,power_law_1.01,0.4547840118408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,16,1,power_law_1.01,0.45531520843505857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,16,1,power_law_1.2,0.45864319801330566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,16,1,power_law_1.2,0.46077442169189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,2,1,balanced,0.9785119692484537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,2,1,balanced,0.9851093292236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,2,1,power_law_1.01,1.1823360443115234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,2,1,power_law_1.01,1.1836416244506835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,2,1,power_law_1.2,1.2143487930297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,2,1,power_law_1.2,1.2196288108825684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,32,1,balanced,0.3553813298543294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,32,1,balanced,0.35547733306884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,32,1,power_law_1.01,0.3972480058670044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,32,1,power_law_1.01,0.3992511987686157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,32,1,power_law_1.2,0.4011199951171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,32,1,power_law_1.2,0.4033664226531982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,4,1,balanced,0.628053347269694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,4,1,balanced,0.6284480094909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,4,1,power_law_1.01,0.75033597946167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,4,1,power_law_1.01,0.7565760135650634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,4,1,power_law_1.2,0.7634751796722412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,4,1,power_law_1.2,0.7641471862792969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,8,1,balanced,0.4470506509145101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,8,1,balanced,0.44857601324717206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,8,1,power_law_1.01,0.5425407886505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,8,1,power_law_1.01,0.5460159778594971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,8,1,power_law_1.2,0.5477824211120605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,6144,2560,8,160,8,1,power_law_1.2,0.5479487895965576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,1,balanced,2.4589759508768716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,1,balanced,2.5559733708699546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,1,power_law_1.01,2.597868728637695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,1,power_law_1.01,2.648089599609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,1,power_law_1.2,2.7260223388671876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,1,power_law_1.2,2.8173120498657225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,128,balanced,0.4265013138453166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,128,balanced,0.429690678914388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,128,power_law_1.01,0.4467264175415039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,128,power_law_1.01,0.4522751808166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,128,power_law_1.2,0.462553596496582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,128,power_law_1.2,0.4659264087677002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,16,balanced,0.5471573273340861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,16,balanced,0.5477706591288248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,16,power_law_1.01,0.5847871780395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,16,power_law_1.01,0.5896512031555176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,16,power_law_1.2,0.617523193359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,16,power_law_1.2,0.6212480068206787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,2,balanced,1.4397385915120442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,2,balanced,1.4675200780232747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,2,power_law_1.01,1.5185791969299316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,2,power_law_1.01,1.5459327697753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,2,power_law_1.2,1.6227840423583983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,2,power_law_1.2,1.6363008499145508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,256,balanced,0.4221920172373454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,256,balanced,0.42236268520355225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,256,power_law_1.01,0.43777918815612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,256,power_law_1.01,0.43790721893310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,256,power_law_1.2,0.450105619430542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,256,power_law_1.2,0.46035199165344237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,32,balanced,0.47472532590230304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,32,balanced,0.47605331738789874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,32,power_law_1.01,0.513478422164917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,32,power_law_1.01,0.5148416042327881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,32,power_law_1.2,0.5295743942260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,32,power_law_1.2,0.5341695785522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,4,balanced,0.930618683497111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,4,balanced,0.9328373273213705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,4,power_law_1.01,0.9962880134582519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,4,power_law_1.01,1.0007616043090821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,4,power_law_1.2,1.0378368377685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,4,power_law_1.2,1.0547519683837892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,64,balanced,0.43935998280843097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,64,balanced,0.44091200828552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,64,power_law_1.01,0.46966400146484377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,64,power_law_1.01,0.47212800979614256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,64,power_law_1.2,0.48698878288269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,64,power_law_1.2,0.4964479923248291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,8,balanced,0.6744426886240641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,8,balanced,0.6757760047912598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,8,power_law_1.01,0.7256832122802734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,8,power_law_1.01,0.7364672183990478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,8,power_law_1.2,0.7598656177520752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,1,8,power_law_1.2,0.759987211227417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,16,1,balanced,0.5045386552810669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,16,1,balanced,0.5047573248545328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,16,1,power_law_1.01,0.5630591869354248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,16,1,power_law_1.01,0.5635136127471924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,16,1,power_law_1.2,0.5754816055297851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,16,1,power_law_1.2,0.5803840160369873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,2,1,balanced,1.3412426312764485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,2,1,balanced,1.3633119265238445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,2,1,power_law_1.01,1.4606911659240722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,2,1,power_law_1.01,1.4670144081115724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,2,1,power_law_1.2,1.524665641784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,2,1,power_law_1.2,1.539743995666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,32,1,balanced,0.4551680088043213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,32,1,balanced,0.4561013380686442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,32,1,power_law_1.01,0.5095168113708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,32,1,power_law_1.01,0.5129087924957275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,32,1,power_law_1.2,0.5243264198303222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,32,1,power_law_1.2,0.5296383857727051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,4,1,balanced,0.8520479996999105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,4,1,balanced,0.8528800010681152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,4,1,power_law_1.01,0.9322879791259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,4,1,power_law_1.01,0.9368000030517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,4,1,power_law_1.2,0.9728384017944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,4,1,power_law_1.2,0.9777279853820801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,8,1,balanced,0.6301279862721761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,8,1,balanced,0.6331093311309814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,8,1,power_law_1.01,0.6817599773406983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,8,1,power_law_1.01,0.6853504180908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,8,1,power_law_1.2,0.7028031826019288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,256,8,1,power_law_1.2,0.7044352054595947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,1,balanced,3.677333196004232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,1,balanced,3.677365303039551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,1,power_law_1.01,3.4661441802978517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,1,power_law_1.01,3.4841281890869142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,1,power_law_1.2,3.6586559295654295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,1,power_law_1.2,3.74505615234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,128,balanced,0.4902240037918091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,128,balanced,0.49134401480356854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,128,power_law_1.01,0.5057983875274659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,128,power_law_1.01,0.5068863868713379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,128,power_law_1.2,0.5211967945098877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,128,power_law_1.2,0.5219391822814942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,16,balanced,0.6624639828999838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,16,balanced,0.665114680926005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,16,power_law_1.01,0.6815231800079345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,16,power_law_1.01,0.6877056121826172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,16,power_law_1.2,0.7039103984832764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,16,power_law_1.2,0.7154816150665283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,2,balanced,1.9861706097920735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,2,balanced,2.01418670018514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,2,power_law_1.01,1.9625024795532227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,2,power_law_1.01,1.999692726135254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,2,power_law_1.2,2.059564781188965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,2,power_law_1.2,2.0692800521850585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,32,balanced,0.5662506818771362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,32,balanced,0.5666933457056681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,32,power_law_1.01,0.5855743885040283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,32,power_law_1.01,0.5921472072601318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,32,power_law_1.2,0.6020607948303223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,32,power_law_1.2,0.6063231945037841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,4,balanced,1.2274400393168132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,4,balanced,1.227834701538086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,4,power_law_1.01,1.2408831596374512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,4,power_law_1.01,1.2547136306762696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,4,power_law_1.2,1.3089599609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,4,power_law_1.2,1.317369556427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,64,balanced,0.5137813488642374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,64,balanced,0.5163733164469401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,64,power_law_1.01,0.5381311893463134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,64,power_law_1.01,0.5393727779388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,64,power_law_1.2,0.5414783954620361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,64,power_law_1.2,0.5511551856994629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,8,balanced,0.8582133452097574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,8,balanced,0.8583412965138754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,8,power_law_1.01,0.8683775901794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,8,power_law_1.01,0.8771903991699219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,8,power_law_1.2,0.8955136299133301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,1,8,power_law_1.2,0.897977638244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,16,1,balanced,0.6646613279978434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,16,1,balanced,0.667792002360026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,16,1,power_law_1.01,0.6625664234161377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,16,1,power_law_1.01,0.6656640052795411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,16,1,power_law_1.2,0.6825664043426514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,16,1,power_law_1.2,0.6864575862884521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,2,1,balanced,1.8838079770406086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,2,1,balanced,1.9958613713582356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,2,1,power_law_1.01,1.8783615112304688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,2,1,power_law_1.01,1.9256000518798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,2,1,power_law_1.2,1.963327980041504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,2,1,power_law_1.2,2.0147008895874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,32,1,balanced,0.6084853410720825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,32,1,balanced,0.6095893383026123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,32,1,power_law_1.01,0.605292797088623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,32,1,power_law_1.01,0.6101503849029541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,32,1,power_law_1.2,0.6253312110900879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,32,1,power_law_1.2,0.6309887886047363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,4,1,balanced,1.1823146343231201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,4,1,balanced,1.1842719713846843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,4,1,power_law_1.01,1.1590784072875977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,4,1,power_law_1.01,1.1673919677734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,4,1,power_law_1.2,1.2234368324279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,4,1,power_law_1.2,1.2239551544189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,8,1,balanced,0.8450613021850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,8,1,balanced,0.8463520208994547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,8,1,power_law_1.01,0.8407615661621094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,8,1,power_law_1.01,0.840998363494873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,8,1,power_law_1.2,0.8596416473388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,2048,7168,2048,8,384,8,1,power_law_1.2,0.8611200332641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,1,balanced,0.151119997104009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,1,balanced,0.15161599715550741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,1,power_law_1.01,0.1460736036300659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,1,power_law_1.01,0.1474303960800171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,1,power_law_1.2,0.1446720004081726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,1,power_law_1.2,0.14804480075836182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,128,balanced,0.05198933184146881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,128,balanced,0.053301334381103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,128,power_law_1.01,0.05237759947776795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,128,power_law_1.01,0.05238400101661682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,128,power_law_1.2,0.05187839865684509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,128,power_law_1.2,0.05229439735412598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,16,balanced,0.0539680023988088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,16,balanced,0.054005334774653115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,16,power_law_1.01,0.053881597518920896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,16,power_law_1.01,0.05421440005302429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,16,power_law_1.2,0.05397760272026062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,16,power_law_1.2,0.05399680137634277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,2,balanced,0.10413866241772969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,2,balanced,0.10443199674288432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,2,power_law_1.01,0.0997439980506897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,2,power_law_1.01,0.1012992024421692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,2,power_law_1.2,0.10220160484313964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,2,power_law_1.2,0.10321919918060303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,32,balanced,0.05377600093682607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,32,balanced,0.05390933156013489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,32,power_law_1.01,0.05258240103721619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,32,power_law_1.01,0.052799999713897705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,32,power_law_1.2,0.05296639800071716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,32,power_law_1.2,0.053324800729751584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,4,balanced,0.08025066554546356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,4,balanced,0.08167466521263123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,4,power_law_1.01,0.07923200130462646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,4,power_law_1.01,0.08000640273094177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,4,power_law_1.2,0.07950720191001892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,4,power_law_1.2,0.08061439990997314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,64,balanced,0.05203733344872793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,64,balanced,0.05392000079154968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,64,power_law_1.01,0.05108479857444763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,64,power_law_1.01,0.0515392005443573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,64,power_law_1.2,0.05196800231933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,64,power_law_1.2,0.05253120064735413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,8,balanced,0.060122668743133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,8,balanced,0.06019733349482218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,8,power_law_1.01,0.060262399911880496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,8,power_law_1.01,0.061926400661468504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,8,power_law_1.2,0.06183040142059326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,1,8,power_law_1.2,0.0631168007850647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,2,1,balanced,0.09954667091369629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,2,1,balanced,0.10079999764760335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,2,1,power_law_1.01,0.09782400131225585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,2,1,power_law_1.01,0.09801599979400635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,2,1,power_law_1.2,0.09821439981460571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,2,1,power_law_1.2,0.0997439980506897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,4,1,balanced,0.07726400097211202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,4,1,balanced,0.07834666470686595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,4,1,power_law_1.01,0.07573760151863099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,4,1,power_law_1.01,0.07613440155982971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,4,1,power_law_1.2,0.07704960107803345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2048,768,8,128,4,1,power_law_1.2,0.07744640111923218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,1,balanced,0.36316800117492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,1,balanced,0.36540265878041583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,1,power_law_1.01,0.3423680067062378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,1,power_law_1.01,0.3472127914428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,1,power_law_1.2,0.3474303960800171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,1,power_law_1.2,0.3478463888168335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,128,balanced,0.07288533449172974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,128,balanced,0.07423999905586243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,128,power_law_1.01,0.0725823998451233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,128,power_law_1.01,0.07285119891166687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,128,power_law_1.2,0.07279999852180481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,128,power_law_1.2,0.07308160066604615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,16,balanced,0.08514133095741272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,16,balanced,0.08657067020734151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,16,power_law_1.01,0.08442879915237426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,16,power_law_1.01,0.08484479784965515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,16,power_law_1.2,0.08654720187187195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,16,power_law_1.2,0.08686720132827759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,2,balanced,0.22637333472569784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,2,balanced,0.2281386653582255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,2,power_law_1.01,0.21346559524536132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,2,power_law_1.01,0.2154304027557373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,2,power_law_1.2,0.21877760887145997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,2,power_law_1.2,0.2212991952896118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,32,balanced,0.0766293356815974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,32,balanced,0.07792533437410991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,32,power_law_1.01,0.07544959783554077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,32,power_law_1.01,0.07605760097503662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,32,power_law_1.2,0.07720320224761963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,32,power_law_1.2,0.07934719920158387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,4,balanced,0.1506666640440623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,4,balanced,0.1525813341140747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,4,power_law_1.01,0.1427072048187256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,4,power_law_1.01,0.14540799856185913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,4,power_law_1.2,0.1478592038154602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,4,power_law_1.2,0.14921599626541138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,64,balanced,0.0745066652695338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,64,balanced,0.0745119998852412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,64,power_law_1.01,0.07251840233802795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,64,power_law_1.01,0.07284479737281799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,64,power_law_1.2,0.07288960218429566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,64,power_law_1.2,0.07354879975318909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,8,balanced,0.11311466495196025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,8,balanced,0.11446932951609294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,8,power_law_1.01,0.10804480314254761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,8,power_law_1.01,0.11029119491577148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,8,power_law_1.2,0.10915199518203736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,1,8,power_law_1.2,0.11093759536743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,16,1,balanced,0.33018134037653607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,16,1,balanced,0.3311893343925476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,16,1,power_law_1.01,0.3081792116165161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,16,1,power_law_1.01,0.30945920944213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,16,1,power_law_1.2,0.3277760028839111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,16,1,power_law_1.2,0.3285056114196777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,2,1,balanced,0.2172373334566752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,2,1,balanced,0.2172693411509196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,2,1,power_law_1.01,0.19802240133285523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,2,1,power_law_1.01,0.20280959606170654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,2,1,power_law_1.2,0.20668160915374756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,2,1,power_law_1.2,0.20914559364318847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,32,1,balanced,0.2877546747525533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,32,1,balanced,0.29314666986465454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,32,1,power_law_1.01,0.2694080114364624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,32,1,power_law_1.01,0.2696768045425415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,32,1,power_law_1.2,0.27912321090698244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,32,1,power_law_1.2,0.28418560028076173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,4,1,balanced,0.14078399538993835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,4,1,balanced,0.14215466380119324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,4,1,power_law_1.01,0.13549439907073973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,4,1,power_law_1.01,0.1357375979423523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,4,1,power_law_1.2,0.1373247981071472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,4,1,power_law_1.2,0.1373311996459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,8,1,balanced,0.42881067593892414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,8,1,balanced,0.42918399969736737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,8,1,power_law_1.01,0.39278719425201414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,8,1,power_law_1.01,0.402239990234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,8,1,power_law_1.2,0.4108799934387207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,2688,1856,6,128,8,1,power_law_1.2,0.4165056228637695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,1,balanced,0.6138346592585245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,1,balanced,0.6145066817601522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,1,power_law_1.01,0.5384960174560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,1,power_law_1.01,0.5402112007141113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,1,power_law_1.2,0.552345609664917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,1,power_law_1.2,0.5569215774536133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,128,balanced,0.10534399747848511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,128,balanced,0.10632000366846721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,128,power_law_1.01,0.10442240238189697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,128,power_law_1.01,0.1047551989555359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,128,power_law_1.2,0.10444799661636353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,128,power_law_1.2,0.10512000322341919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,16,balanced,0.14008532961209616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,16,balanced,0.1421226660410563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,16,power_law_1.01,0.1315392017364502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,16,power_law_1.01,0.13189760446548462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,16,power_law_1.2,0.13235199451446533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,16,power_law_1.2,0.13498239517211913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,2,balanced,0.3680533170700073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,2,balanced,0.3686559995015462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,2,power_law_1.01,0.3298624038696289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,2,power_law_1.01,0.3319616079330444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,2,power_law_1.2,0.33000960350036623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,2,power_law_1.2,0.33470079898834226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,256,balanced,0.10526399811108907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,256,balanced,0.10664533575375874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,256,power_law_1.01,0.10489599704742432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,256,power_law_1.01,0.10533759593963624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,256,power_law_1.2,0.10462720394134521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,256,power_law_1.2,0.1051584005355835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,32,balanced,0.11559466520945232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,32,balanced,0.11778133114178975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,32,power_law_1.01,0.1144063949584961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,32,power_law_1.01,0.11465599536895751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,32,power_law_1.2,0.1134335994720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,32,power_law_1.2,0.11508480310440064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,4,balanced,0.24066666762034097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,4,balanced,0.24078933397928873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,4,power_law_1.01,0.22232959270477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,4,power_law_1.01,0.22639999389648438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,4,power_law_1.2,0.22154879570007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,4,power_law_1.2,0.2352128028869629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,64,balanced,0.1074666678905487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,64,balanced,0.10940800110499065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,64,power_law_1.01,0.10685440301895141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,64,power_law_1.01,0.10772479772567749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,64,power_law_1.2,0.10679039955139161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,64,power_law_1.2,0.10797439813613892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,8,balanced,0.17282134294509888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,8,balanced,0.17472533384958902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,8,power_law_1.01,0.1647871971130371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,8,power_law_1.01,0.16569600105285645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,8,power_law_1.2,0.16260479688644408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,1,8,power_law_1.2,0.16455039978027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,16,1,balanced,0.13691199819246927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,16,1,balanced,0.13902933398882547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,16,1,power_law_1.01,0.12434560060501099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,16,1,power_law_1.01,0.1245695948600769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,16,1,power_law_1.2,0.12466559410095215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,16,1,power_law_1.2,0.12654720544815062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,2,1,balanced,0.3458346525828044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,2,1,balanced,0.34700266520182294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,2,1,power_law_1.01,0.31036159992218015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,2,1,power_law_1.01,0.3138432025909424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,2,1,power_law_1.2,0.31130878925323485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,2,1,power_law_1.2,0.3159615993499756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,32,1,balanced,0.1172266701857249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,32,1,balanced,0.11921599507331848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,32,1,power_law_1.01,0.11042560338973999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,32,1,power_law_1.01,0.11050879955291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,32,1,power_law_1.2,0.1109887957572937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,32,1,power_law_1.2,0.1119488000869751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,4,1,balanced,0.22202134132385254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,4,1,balanced,0.22307199239730835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,4,1,power_law_1.01,0.19697279930114747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,4,1,power_law_1.01,0.1986240029335022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,4,1,power_law_1.2,0.1982143998146057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,4,1,power_law_1.2,0.20325119495391847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,8,1,balanced,0.16019733746846518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,8,1,balanced,0.16126933693885803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,8,1,power_law_1.01,0.14937599897384643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,8,1,power_law_1.01,0.1505087971687317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,8,1,power_law_1.2,0.1503424048423767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,3072,1536,8,256,8,1,power_law_1.2,0.15135999917984008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,1,balanced,0.3001386721928914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,1,balanced,0.3038453261057536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,1,power_law_1.01,0.36465280055999755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,1,power_law_1.01,0.37073919773101804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,1,power_law_1.2,0.3683775901794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,1,power_law_1.2,0.38385920524597167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,2,balanced,0.21763734022776285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,2,balanced,0.2211093306541443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,2,power_law_1.01,0.24720640182495118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,2,power_law_1.01,0.25107200145721437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,2,power_law_1.2,0.25427200794219973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,2,power_law_1.2,0.2584575891494751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,4,balanced,0.17430933316548666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,4,balanced,0.17523199319839478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,4,power_law_1.01,0.19717119932174682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,4,power_law_1.01,0.2026304006576538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,4,power_law_1.2,0.19976320266723632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,4,power_law_1.2,0.20133121013641359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,8,balanced,0.1588266690572103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,8,balanced,0.15984533230463663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,8,power_law_1.01,0.1754047989845276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,8,power_law_1.01,0.1784832000732422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,8,power_law_1.2,0.17487360239028932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,1,8,power_law_1.2,0.1804927945137024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,16,1,balanced,0.05183466772238413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,16,1,balanced,0.054330666859944664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,16,1,power_law_1.01,0.05921279788017273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,16,1,power_law_1.01,0.06002560257911682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,16,1,power_law_1.2,0.06096640229225159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,16,1,power_law_1.2,0.06272000074386597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,2,1,balanced,0.1775839924812317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,2,1,balanced,0.17876267433166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,2,1,power_law_1.01,0.19457279443740844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,2,1,power_law_1.01,0.20838398933410646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,2,1,power_law_1.2,0.1890944004058838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,2,1,power_law_1.2,0.19863040447235109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,32,1,balanced,0.04163199911514918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,32,1,balanced,0.04223466912905375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,32,1,power_law_1.01,0.04306559860706329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,32,1,power_law_1.01,0.04340479969978332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,32,1,power_law_1.2,0.04374400079250336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,32,1,power_law_1.2,0.04447999894618988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,4,1,balanced,0.11550399661064148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,4,1,balanced,0.11607467134793599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,4,1,power_law_1.01,0.1150015950202942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,4,1,power_law_1.01,0.1186303973197937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,4,1,power_law_1.2,0.1159551978111267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,4,1,power_law_1.2,0.11649919748306274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,8,1,balanced,0.07332799832026164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,8,1,balanced,0.0765173335870107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,8,1,power_law_1.01,0.07457919716835022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,8,1,power_law_1.01,0.07657600045204163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,8,1,power_law_1.2,0.07631360292434693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,14336,2,8,8,1,power_law_1.2,0.07831680178642272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,1,balanced,0.4280800024668376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,1,balanced,0.4307680130004883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,1,power_law_1.01,0.41518077850341795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,1,power_law_1.01,0.4198463916778564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,1,power_law_1.2,0.4356031894683838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,1,power_law_1.2,0.4400191783905029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,128,balanced,0.08492799599965413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,128,balanced,0.08614400029182434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,128,power_law_1.01,0.08347520232200623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,128,power_law_1.01,0.08366720080375671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,128,power_law_1.2,0.08365439772605895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,128,power_law_1.2,0.08407679796218873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,16,balanced,0.09732266267140706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,16,balanced,0.10070932904879253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,16,power_law_1.01,0.09905920028686524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,16,power_law_1.01,0.09996799826622009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,16,power_law_1.2,0.10115200281143188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,16,power_law_1.2,0.10127359628677368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,2,balanced,0.2630133430163066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,2,balanced,0.2632426619529724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,2,power_law_1.01,0.25870718955993655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,2,power_law_1.01,0.2589184045791626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,2,power_law_1.2,0.26102399826049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,2,power_law_1.2,0.2629184007644653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,32,balanced,0.09047999978065491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,32,balanced,0.09067199627558391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,32,power_law_1.01,0.08965759873390197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,32,power_law_1.01,0.08978559970855712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,32,power_law_1.2,0.09132800102233887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,32,power_law_1.2,0.09242879748344421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,4,balanced,0.17275200287501016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,4,balanced,0.17323199907938638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,4,power_law_1.01,0.16992000341415406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,4,power_law_1.01,0.17539199590682983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,4,power_law_1.2,0.17552640438079833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,4,power_law_1.2,0.17643519639968872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,64,balanced,0.08483733733495076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,64,balanced,0.0848586658636729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,64,power_law_1.01,0.08483200073242188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,64,power_law_1.01,0.08513280153274536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,64,power_law_1.2,0.08399360179901123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,64,power_law_1.2,0.08687360286712646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,8,balanced,0.13054399689038595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,8,balanced,0.13076266646385193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,8,power_law_1.01,0.1324671983718872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,8,power_law_1.01,0.13303040266036986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,8,power_law_1.2,0.13232640027999878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,1,8,power_law_1.2,0.13304320573806763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,16,1,balanced,0.10513599713643391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,16,1,balanced,0.10674132903416951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,16,1,power_law_1.01,0.10408960580825806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,16,1,power_law_1.01,0.10542720556259155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,16,1,power_law_1.2,0.10645120143890381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,2,1,balanced,0.2536960045496623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,2,1,balanced,0.25406932830810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,2,1,power_law_1.01,0.2486272096633911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,2,1,power_law_1.01,0.24966399669647216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,2,1,power_law_1.2,0.24938879013061524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,2,1,power_law_1.2,0.24955520629882813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,32,1,balanced,0.09676800171534221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,32,1,balanced,0.09708266456921895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,32,1,power_law_1.01,0.09675520062446594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,32,1,power_law_1.01,0.09749760031700135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,32,1,power_law_1.2,0.09716479778289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,32,1,power_law_1.2,0.09787520170211791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,4,1,balanced,0.16522666811943054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,4,1,balanced,0.16566933194796243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,4,1,power_law_1.01,0.15972479581832885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,4,1,power_law_1.01,0.16043519973754883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,4,1,power_law_1.2,0.16191359758377075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,4,1,power_law_1.2,0.16221439838409424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,8,1,balanced,0.12396267056465149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,8,1,balanced,0.12547733386357626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,8,1,power_law_1.01,0.12113280296325683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,8,1,power_law_1.01,0.12206079959869384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,8,1,power_law_1.2,0.12197120189666748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,1536,8,128,8,1,power_law_1.2,0.1245695948600769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,1,balanced,2.7554826736450195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,1,balanced,2.767039934794108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,1,power_law_1.01,2.4841856002807616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,1,power_law_1.01,2.5285951614379885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,1,power_law_1.2,2.595187187194824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,1,power_law_1.2,2.603104019165039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,128,balanced,0.3173333406448364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,128,balanced,0.31756265958150226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,128,power_law_1.01,0.3146048069000244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,128,power_law_1.01,0.3147711992263794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,128,power_law_1.2,0.31773440837860106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,128,power_law_1.2,0.31816959381103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,16,balanced,0.47522131601969403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,16,balanced,0.4772213300069173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,16,power_law_1.01,0.45975680351257325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,16,power_law_1.01,0.4646592140197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,16,power_law_1.2,0.46691198348999025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,16,power_law_1.2,0.47057280540466306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,2,balanced,1.5273386637369792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,2,balanced,1.533023993174235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,2,power_law_1.01,1.4070719718933105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,2,power_law_1.01,1.421407985687256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,2,power_law_1.2,1.460908794403076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,2,power_law_1.2,1.4630975723266602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,256,balanced,0.3102186719576518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,256,balanced,0.31090132395426434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,256,power_law_1.01,0.3091775894165039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,256,power_law_1.01,0.30951039791107177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,256,power_law_1.2,0.3095616102218628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,256,power_law_1.2,0.3115648031234741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,32,balanced,0.3900373379389445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,32,balanced,0.39212799072265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,32,power_law_1.01,0.38436479568481446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,32,power_law_1.01,0.38480639457702637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,32,power_law_1.2,0.3850496053695679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,32,power_law_1.2,0.38869121074676516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,4,balanced,0.9270293712615967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,4,balanced,0.9313279787699381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,4,power_law_1.01,0.8623040199279786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,4,power_law_1.01,0.8728832244873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,4,power_law_1.2,0.9011327743530273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,4,power_law_1.2,0.9038592338562011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,64,balanced,0.33853332201639813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,64,balanced,0.3398933410644531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,64,power_law_1.01,0.33096320629119874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,64,power_law_1.01,0.3348095893859863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,64,power_law_1.2,0.3418495893478394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,64,power_law_1.2,0.3450432062149048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,8,balanced,0.6271680196126302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,8,balanced,0.6298773288726807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,8,power_law_1.01,0.5929664134979248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,8,power_law_1.01,0.6002048015594482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,8,power_law_1.2,0.612063980102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,1,8,power_law_1.2,0.6169343948364258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,16,1,balanced,2.300314744313558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,16,1,balanced,2.303717295328776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,16,1,power_law_1.01,2.100275230407715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,16,1,power_law_1.01,2.133286476135254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,16,1,power_law_1.2,2.2031360626220704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,16,1,power_law_1.2,2.2390207290649413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,2,1,balanced,1.4259840647379558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,2,1,balanced,1.4557545979817708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,2,1,power_law_1.01,1.297555160522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,2,1,power_law_1.01,1.3258624076843262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,2,1,power_law_1.2,1.3618240356445312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,2,1,power_law_1.2,1.3712832450866699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,32,1,balanced,1.787552038828532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,32,1,balanced,1.7905227343241374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,32,1,power_law_1.01,1.632441520690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,32,1,power_law_1.01,1.6557888031005858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,32,1,power_law_1.2,1.7302656173706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,32,1,power_law_1.2,1.7553792953491212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,4,1,balanced,0.8128800392150879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,4,1,balanced,0.8153759638468424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,4,1,power_law_1.01,0.7473279953002929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,4,1,power_law_1.01,0.751417589187622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,4,1,power_law_1.2,0.7723775863647461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,4,1,power_law_1.2,0.7828095912933349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,8,1,balanced,0.5120533307393392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,8,1,balanced,0.5124586820602417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,8,1,power_law_1.01,0.48129920959472655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,8,1,power_law_1.01,0.48210558891296384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,8,1,power_law_1.2,0.49511041641235354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,4096,2688,22,512,8,1,power_law_1.2,0.5008831977844238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,1,balanced,0.4509173234303792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,1,balanced,0.45333866278330487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,1,power_law_1.01,0.5969024181365967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,1,power_law_1.01,0.5987520217895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,1,power_law_1.2,0.6016064167022706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,1,power_law_1.2,0.6227136135101319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,2,balanced,0.29397332668304443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,2,balanced,0.29665066798528034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,2,power_law_1.01,0.37223680019378663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,2,power_law_1.01,0.3772480010986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,2,power_law_1.2,0.36205439567565917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,2,power_law_1.2,0.4133120059967041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,4,balanced,0.21928532918294272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,4,balanced,0.22150933742523193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,4,power_law_1.01,0.25848960876464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,4,power_law_1.01,0.28063359260559084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,4,power_law_1.2,0.26752638816833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,4,power_law_1.2,0.2765503883361816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,8,balanced,0.19329599539438883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,8,balanced,0.193615992863973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,8,power_law_1.01,0.21580159664154053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,8,power_law_1.01,0.22909440994262695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,8,power_law_1.2,0.2149951934814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,1,8,power_law_1.2,0.2228543996810913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,16,1,balanced,0.07986666758855183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,16,1,balanced,0.08018133540948232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,16,1,power_law_1.01,0.08319360017776489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,16,1,power_law_1.01,0.08341119885444641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,16,1,power_law_1.2,0.08293759822845459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,16,1,power_law_1.2,0.08350080251693726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,2,1,balanced,0.2566133340199788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,2,1,balanced,0.25726399819056195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,2,1,power_law_1.01,0.3050175905227661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,2,1,power_law_1.01,0.3057152032852173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,2,1,power_law_1.2,0.3126591920852661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,2,1,power_law_1.2,0.31697280406951905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,32,1,balanced,0.05992533266544342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,32,1,balanced,0.06425599753856659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,32,1,power_law_1.01,0.07094399929046631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,32,1,power_law_1.01,0.07100160121917724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,32,1,power_law_1.2,0.06965759992599488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,32,1,power_law_1.2,0.07124480009078979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,4,1,balanced,0.158160001039505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,4,1,balanced,0.16065067052841187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,4,1,power_law_1.01,0.16962560415267944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,4,1,power_law_1.01,0.17696640491485596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,4,1,power_law_1.2,0.16775039434432984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,4,1,power_law_1.2,0.17222399711608888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,8,1,balanced,0.10059199730555217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,8,1,balanced,0.10073066751162212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,8,1,power_law_1.01,0.1074560046195984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,8,1,power_law_1.01,0.11216000318527222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,8,1,power_law_1.2,0.10453120470046998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,16384,2,8,8,1,power_law_1.2,0.11196800470352172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,1,balanced,1.5852746963500977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,1,balanced,1.5867093404134114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,1,power_law_1.01,1.336691188812256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,1,power_law_1.01,1.3736703872680665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,1,power_law_1.2,1.3582592010498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,1,power_law_1.2,1.3801088333129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,128,balanced,0.16641066471735635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,128,balanced,0.16659733653068542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,128,power_law_1.01,0.1653887987136841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,128,power_law_1.01,0.16577279567718506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,128,power_law_1.2,0.16480000019073487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,128,power_law_1.2,0.16548479795455934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,16,balanced,0.25520533323287964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,16,balanced,0.2564586599667867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,16,power_law_1.01,0.24284160137176514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,16,power_law_1.01,0.245849609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,16,power_law_1.2,0.2440959930419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,16,power_law_1.2,0.24895360469818115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,2,balanced,0.8723519643147787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,2,balanced,0.8772266705830892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,2,power_law_1.01,0.7583807945251465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,2,power_law_1.01,0.7721856117248536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,2,power_law_1.2,0.7893887996673584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,2,power_law_1.2,0.8124735832214356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,256,balanced,0.16431466738382974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,256,balanced,0.16497066617012024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,256,power_law_1.01,0.16368000507354735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,256,power_law_1.01,0.1648576021194458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,256,power_law_1.2,0.1627071976661682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,256,power_law_1.2,0.16417920589447021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,32,balanced,0.19670399030049643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,32,balanced,0.19701866308848062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,32,power_law_1.01,0.18240640163421631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,32,power_law_1.01,0.19197440147399902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,32,power_law_1.2,0.18762880563735962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,32,power_law_1.2,0.19173120260238646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,4,balanced,0.515999992688497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,4,balanced,0.5170666774113973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,4,power_law_1.01,0.466707181930542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,4,power_law_1.01,0.4787456035614014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,4,power_law_1.2,0.4693759918212891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,4,power_law_1.2,0.475270414352417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,64,balanced,0.17227200667063394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,64,balanced,0.1732106606165568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,64,power_law_1.01,0.16943360567092897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,64,power_law_1.01,0.17003519535064698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,64,power_law_1.2,0.1699136018753052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,64,power_law_1.2,0.17118079662323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,8,balanced,0.344709316889445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,8,balanced,0.3447999954223633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,8,power_law_1.01,0.3265088081359863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,8,power_law_1.01,0.33520638942718506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,8,power_law_1.2,0.3215679883956909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,1,8,power_law_1.2,0.3291647911071777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,16,1,balanced,0.2510133385658264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,16,1,balanced,0.25145065784454346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,16,1,power_law_1.01,0.22076160907745362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,16,1,power_law_1.01,0.23311359882354737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,16,1,power_law_1.2,0.2246016025543213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,16,1,power_law_1.2,0.2301248073577881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,2,1,balanced,0.823253313700358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,2,1,balanced,0.8258986473083496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,2,1,power_law_1.01,0.7177087783813476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,2,1,power_law_1.01,0.7189631938934327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,2,1,power_law_1.2,0.7211008071899414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,2,1,power_law_1.2,0.7420800209045411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,32,1,balanced,0.2097439964612325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,32,1,balanced,0.21079999208450317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,32,1,power_law_1.01,0.19664000272750853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,32,1,power_law_1.01,0.19790079593658447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,32,1,power_law_1.2,0.19639040231704713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,32,1,power_law_1.2,0.19866880178451538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,4,1,balanced,0.47623999913533527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,4,1,balanced,0.4779733419418335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,4,1,power_law_1.01,0.4272448062896729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,4,1,power_law_1.01,0.43045759201049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,4,1,power_law_1.2,0.42951040267944335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,4,1,power_law_1.2,0.4396224021911621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,8,1,balanced,0.3226880033810933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,8,1,balanced,0.324074665705363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,8,1,power_law_1.01,0.2850239992141724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,8,1,power_law_1.01,0.2925568103790283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,8,1,power_law_1.2,0.2909503936767578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2048,8,256,8,1,power_law_1.2,0.2916352033615112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,1,balanced,1.2353920141855876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,1,balanced,1.2399520079294841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,1,power_law_1.01,1.1618176460266114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,1,power_law_1.01,1.1681407928466796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,1,power_law_1.2,1.1930624008178712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,1,power_law_1.2,1.1980992317199708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,16,balanced,0.20827200015385947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,16,balanced,0.20947732528050741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,16,power_law_1.01,0.20565760135650635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,16,power_law_1.01,0.2090751886367798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,16,power_law_1.2,0.2089855909347534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,16,power_law_1.2,0.2092736005783081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,2,balanced,0.6838400363922119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,2,balanced,0.6860427061716715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,2,power_law_1.01,0.6414271831512451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,2,power_law_1.01,0.6667391777038574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,2,power_law_1.2,0.6667136192321778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,2,power_law_1.2,0.6667200088500976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,32,balanced,0.1527786652247111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,32,balanced,0.15402666727701822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,32,power_law_1.01,0.15156480073928832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,32,power_law_1.01,0.15445760488510132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,32,power_law_1.2,0.15591039657592773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,32,power_law_1.2,0.16387840509414672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,4,balanced,0.41139201323191327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,4,balanced,0.41327468554178876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,4,power_law_1.01,0.3987519979476929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,4,power_law_1.01,0.4010623931884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,4,power_law_1.2,0.40344958305358886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,4,power_law_1.2,0.4040383815765381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,8,balanced,0.2750133275985718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,8,balanced,0.27694932619730633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,8,power_law_1.01,0.25908479690551756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,8,power_law_1.01,0.26735999584198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,8,power_law_1.2,0.2746560096740723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,1,8,power_law_1.2,0.27506558895111083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,16,1,balanced,0.2063680092493693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,16,1,balanced,0.20769067605336508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,16,1,power_law_1.01,0.20257918834686278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,16,1,power_law_1.01,0.20291199684143066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,16,1,power_law_1.2,0.20322558879852295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,16,1,power_law_1.2,0.20442240238189696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,2,1,balanced,0.6604373455047607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,2,1,balanced,0.6643040180206299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,2,1,power_law_1.01,0.6200831890106201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,2,1,power_law_1.01,0.6224319934844971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,2,1,power_law_1.2,0.6293888092041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,2,1,power_law_1.2,0.6356607913970947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,32,1,balanced,0.16267733772595724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,32,1,balanced,0.16343466440836588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,32,1,power_law_1.01,0.1575551986694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,32,1,power_law_1.01,0.1585536003112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,32,1,power_law_1.2,0.16131839752197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,32,1,power_law_1.2,0.16204160451889038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,4,1,balanced,0.37836265563964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,4,1,balanced,0.38096535205841064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,4,1,power_law_1.01,0.363974404335022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,4,1,power_law_1.01,0.36652159690856934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,4,1,power_law_1.2,0.37072000503540037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,4,1,power_law_1.2,0.37097599506378176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,8,1,balanced,0.24655999739964804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,8,1,balanced,0.2466933329900106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,8,1,power_law_1.01,0.23714559078216552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,8,1,power_law_1.01,0.23816959857940673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,8,1,power_law_1.2,0.24315519332885743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,6144,2560,8,160,8,1,power_law_1.2,0.2435904026031494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,1,balanced,1.8403627077738445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,1,balanced,1.8491360346476238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,1,power_law_1.01,1.556383991241455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,1,power_law_1.01,1.5842432022094726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,1,power_law_1.2,1.6040704727172852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,1,power_law_1.2,1.6141183853149415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,128,balanced,0.18290666739145914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,128,balanced,0.1829973260561625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,128,power_law_1.01,0.17984000444412232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,128,power_law_1.01,0.17990399599075318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,128,power_law_1.2,0.1796223998069763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,128,power_law_1.2,0.1799999952316284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,16,balanced,0.28958932558695477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,16,balanced,0.29078932603200275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,16,power_law_1.01,0.2695168018341064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,16,power_law_1.01,0.27876479625701905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,16,power_law_1.2,0.2797696113586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,16,power_law_1.2,0.28108160495758056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,2,balanced,0.9976106484731039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,2,balanced,1.0038613478342693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,2,power_law_1.01,0.8878399848937988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,2,power_law_1.01,0.8941184043884277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,2,power_law_1.2,0.8972415924072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,2,power_law_1.2,0.9140416145324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,256,balanced,0.17893866697947183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,256,balanced,0.1808639963467916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,256,power_law_1.01,0.17825280427932738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,256,power_law_1.01,0.17848960161209107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,256,power_law_1.2,0.1794368028640747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,256,power_law_1.2,0.17989759445190429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,32,balanced,0.22039467096328735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,32,balanced,0.22220265865325928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,32,power_law_1.01,0.21332480907440185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,32,power_law_1.01,0.21356799602508544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,32,power_law_1.2,0.21004159450531007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,32,power_law_1.2,0.21159040927886963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,4,balanced,0.5884960095087687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,4,balanced,0.5895626544952393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,4,power_law_1.01,0.5396607875823974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,4,power_law_1.01,0.5474431991577149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,4,power_law_1.2,0.5462336063385009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,4,power_law_1.2,0.5650112152099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,64,balanced,0.18691732486089072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,64,balanced,0.18825600544611612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,64,power_law_1.01,0.18495999574661254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,64,power_law_1.01,0.18584959506988524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,64,power_law_1.2,0.1851263999938965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,64,power_law_1.2,0.18597760200500488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,8,balanced,0.38811735312143963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,8,balanced,0.39193065961201984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,8,power_law_1.01,0.35789439678192136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,8,power_law_1.01,0.3709887981414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,8,power_law_1.2,0.3636928081512451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,1,8,power_law_1.2,0.372326397895813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,16,1,balanced,0.2871840000152588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,16,1,balanced,0.2874506711959839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,16,1,power_law_1.01,0.25107200145721437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,16,1,power_law_1.01,0.26652801036834717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,16,1,power_law_1.2,0.2640127897262573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,16,1,power_law_1.2,0.26782081127166746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,2,1,balanced,0.9513066609700521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,2,1,balanced,0.9599466323852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,2,1,power_law_1.01,0.8321920394897461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,2,1,power_law_1.01,0.8333184242248535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,2,1,power_law_1.2,0.830508804321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,2,1,power_law_1.2,0.8758591651916504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,32,1,balanced,0.2371573249499003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,32,1,balanced,0.2381653388341268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,32,1,power_law_1.01,0.2240000009536743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,32,1,power_law_1.01,0.22444798946380615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,32,1,power_law_1.2,0.2236799955368042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,32,1,power_law_1.2,0.22376320362091065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,4,1,balanced,0.5501706600189209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,4,1,balanced,0.5510773261388143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,4,1,power_law_1.01,0.4954944133758545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,4,1,power_law_1.01,0.5037504196166992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,4,1,power_law_1.2,0.4940032005310059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,4,1,power_law_1.2,0.4994944095611572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,8,1,balanced,0.3710026741027832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,8,1,balanced,0.3715466658274333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,8,1,power_law_1.01,0.32460799217224123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,8,1,power_law_1.01,0.3375296115875244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,8,1,power_law_1.2,0.33118720054626466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,256,8,1,power_law_1.2,0.34161279201507566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,1,balanced,2.7783679962158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,1,balanced,2.78548272450765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,1,power_law_1.01,2.1789440155029296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,1,power_law_1.01,2.1990848541259767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,1,power_law_1.2,2.1608320236206056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,1,power_law_1.2,2.168070411682129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,128,balanced,0.24033600091934204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,128,balanced,0.24041066567103067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,128,power_law_1.01,0.23867518901824952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,128,power_law_1.01,0.23900160789489747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,128,power_law_1.2,0.2381887912750244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,128,power_law_1.2,0.23892478942871093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,16,balanced,0.38583465417226154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,16,balanced,0.38756267229715985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,16,power_law_1.01,0.35624959468841555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,16,power_law_1.01,0.36620800495147704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,16,power_law_1.2,0.35301120281219484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,16,power_law_1.2,0.35996160507202146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,2,balanced,1.463930606842041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,2,balanced,1.5016746520996094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,2,power_law_1.01,1.2033663749694825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,2,power_law_1.01,1.2726783752441406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,2,power_law_1.2,1.1809344291687012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,2,power_law_1.2,1.1821503639221191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,32,balanced,0.3059999942779541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,32,balanced,0.30803734064102173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,32,power_law_1.01,0.2877887964248657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,32,power_law_1.01,0.2920383930206299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,32,power_law_1.2,0.28310399055480956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,32,power_law_1.2,0.2954047918319702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,4,balanced,0.8482080300649008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,4,balanced,0.84988800684611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,4,power_law_1.01,0.7322368144989013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,4,power_law_1.01,0.7785280227661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,4,power_law_1.2,0.7090432167053222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,4,power_law_1.2,0.7382847785949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,64,balanced,0.2561759948730469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,64,balanced,0.25883734226226807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,64,power_law_1.01,0.2506047964096069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,64,power_law_1.01,0.2540607929229736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,64,power_law_1.2,0.25112960338592527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,64,power_law_1.2,0.25282559394836424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,8,balanced,0.5442933241526285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,8,balanced,0.5455573399861654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,8,power_law_1.01,0.4806528091430664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,8,power_law_1.01,0.5094655990600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,8,power_law_1.2,0.4886784076690674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,1,8,power_law_1.2,0.5133696079254151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,16,1,balanced,0.3797333240509033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,16,1,balanced,0.37987732887268066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,16,1,power_law_1.01,0.34262399673461913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,16,1,power_law_1.01,0.342630410194397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,16,1,power_law_1.2,0.33919999599456785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,16,1,power_law_1.2,0.34072959423065186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,2,1,balanced,1.3776639302571614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,2,1,balanced,1.4078240394592285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,2,1,power_law_1.01,1.1277631759643554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,2,1,power_law_1.01,1.1366016387939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,2,1,power_law_1.2,1.1095616340637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,2,1,power_law_1.2,1.1177599906921387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,32,1,balanced,0.3233333428700765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,32,1,balanced,0.3253653248151143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,32,1,power_law_1.01,0.29240319728851316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,32,1,power_law_1.01,0.29285120964050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,32,1,power_law_1.2,0.2907263994216919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,32,1,power_law_1.2,0.29154560565948484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,4,1,balanced,0.7857653299967448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,4,1,balanced,0.7901600201924642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,4,1,power_law_1.01,0.6599552154541015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,4,1,power_law_1.01,0.6671552181243896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,4,1,power_law_1.2,0.665119981765747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,4,1,power_law_1.2,0.6705535888671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,8,1,balanced,0.5173066854476929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,8,1,balanced,0.5179466803868612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,8,1,power_law_1.01,0.4380864143371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,8,1,power_law_1.01,0.4393343925476074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,8,1,power_law_1.2,0.43595519065856936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,256,7168,2048,8,384,8,1,power_law_1.2,0.4395904064178467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,1,balanced,0.3892853260040283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,1,balanced,0.39048532644907635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,1,power_law_1.01,0.4031167984008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,1,power_law_1.01,0.40799999237060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,1,power_law_1.2,0.4143871784210205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,1,power_law_1.2,0.41544318199157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,128,balanced,0.20345600446065268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,128,balanced,0.20351467529932657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,128,power_law_1.01,0.21164801120758056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,128,power_law_1.01,0.21281919479370118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,128,power_law_1.2,0.2174527883529663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,128,power_law_1.2,0.21893761157989503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,16,balanced,0.21798400084177652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,16,balanced,0.21822933355967203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,16,power_law_1.01,0.2256319999694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,16,power_law_1.01,0.22856318950653076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,16,power_law_1.2,0.2297663927078247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,16,power_law_1.2,0.2338560104370117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,2,balanced,0.31353600819905597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,2,balanced,0.3154346744219462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,2,power_law_1.01,0.3280832052230835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,2,power_law_1.01,0.3346879959106445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,2,power_law_1.2,0.3334784030914307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,2,power_law_1.2,0.33418879508972166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,32,balanced,0.20985066890716553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,32,balanced,0.20990399519602457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,32,power_law_1.01,0.21902079582214357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,32,power_law_1.01,0.22215039730072023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,32,power_law_1.2,0.22535040378570556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,32,power_law_1.2,0.22702720165252685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,4,balanced,0.2568160096804301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,4,balanced,0.26202134291330975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,4,power_law_1.01,0.2756927967071533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,4,power_law_1.01,0.2800640106201172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,4,power_law_1.2,0.2787519931793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,4,power_law_1.2,0.2835776090621948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,64,balanced,0.20558400948842367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,64,balanced,0.20629332462946573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,64,power_law_1.01,0.21185920238494874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,64,power_law_1.01,0.21285760402679443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,64,power_law_1.2,0.22322559356689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,64,power_law_1.2,0.22430720329284667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,8,balanced,0.23031999667485556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,8,balanced,0.23068267107009888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,8,power_law_1.01,0.24321279525756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,8,power_law_1.01,0.24387838840484619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,8,power_law_1.2,0.24983038902282714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,1,8,power_law_1.2,0.2551424026489258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,2,1,balanced,0.27795199553171795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,2,1,balanced,0.27909332513809204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,2,1,power_law_1.01,0.2865407943725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,2,1,power_law_1.01,0.2875456094741821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,2,1,power_law_1.2,0.28830718994140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,2,1,power_law_1.2,0.29041280746459963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,4,1,balanced,0.2285226583480835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,4,1,balanced,0.2306613326072693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,4,1,power_law_1.01,0.23518080711364747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,4,1,power_law_1.01,0.2359231948852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,4,1,power_law_1.2,0.23902080059051514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2048,768,8,128,4,1,power_law_1.2,0.23959040641784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,1,balanced,0.8092479705810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,1,balanced,0.817792018254598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,1,power_law_1.01,0.7708159923553467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,1,power_law_1.01,0.7824512004852295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,1,power_law_1.2,0.795692777633667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,1,power_law_1.2,0.80447359085083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,128,balanced,0.2649493416150411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,128,balanced,0.2659733295440674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,128,power_law_1.01,0.2801919937133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,128,power_law_1.01,0.2805952072143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,128,power_law_1.2,0.29460480213165285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,128,power_law_1.2,0.29614720344543455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,16,balanced,0.30316799879074097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,16,balanced,0.3034026622772217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,16,power_law_1.01,0.3129983901977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,16,power_law_1.01,0.32118399143218995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,16,power_law_1.2,0.3249023914337158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,16,power_law_1.2,0.3309760093688965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,2,balanced,0.5535893440246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,2,balanced,0.5546826521555582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,2,power_law_1.01,0.5444672107696533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,2,power_law_1.01,0.5762368202209472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,2,power_law_1.2,0.5620672225952148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,2,power_law_1.2,0.5844031810760498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,32,balanced,0.28140799204508465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,32,balanced,0.2826026678085327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,32,power_law_1.01,0.30140159130096433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,32,power_law_1.01,0.3023551940917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,32,power_law_1.2,0.31265280246734617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,32,power_law_1.2,0.31900160312652587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,4,balanced,0.4143679936726888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,4,balanced,0.418015996615092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,4,power_law_1.01,0.42478079795837403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,4,power_law_1.01,0.4278656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,4,power_law_1.2,0.43526401519775393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,4,power_law_1.2,0.43799681663513185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,64,balanced,0.2707786758740743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,64,balanced,0.27269866069157916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,64,power_law_1.01,0.28609280586242675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,64,power_law_1.01,0.2864831924438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,64,power_law_1.2,0.29485440254211426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,64,power_law_1.2,0.2994112014770508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,8,balanced,0.3424746592839559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,8,balanced,0.3450506528218587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,8,power_law_1.01,0.35973761081695554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,8,power_law_1.01,0.3630336046218872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,8,power_law_1.2,0.3682559967041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,1,8,power_law_1.2,0.3692095994949341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,16,1,balanced,1.5236105918884277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,16,1,balanced,1.5253705978393555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,16,1,power_law_1.01,1.386911964416504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,16,1,power_law_1.01,1.4141823768615722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,16,1,power_law_1.2,1.4319168090820313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,16,1,power_law_1.2,1.4384127616882325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,2,1,balanced,0.5136799812316895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,2,1,balanced,0.513861338297526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,2,1,power_law_1.01,0.48778882026672366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,2,1,power_law_1.01,0.49264001846313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,2,1,power_law_1.2,0.5001152038574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,2,1,power_law_1.2,0.5034239768981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,32,1,balanced,1.319818655649821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,32,1,balanced,1.32204270362854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,32,1,power_law_1.01,1.2317119598388673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,32,1,power_law_1.01,1.2331904411315917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,32,1,power_law_1.2,1.258784008026123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,32,1,power_law_1.2,1.2605695724487305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,4,1,balanced,0.3582133452097575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,4,1,balanced,0.3595946629842122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,4,1,power_law_1.01,0.3465984106063843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,4,1,power_law_1.01,0.3518912076950073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,4,1,power_law_1.2,0.35145599842071534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,4,1,power_law_1.2,0.35180799961090087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,8,1,balanced,2.0398826599121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,8,1,balanced,2.062357266743978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,8,1,power_law_1.01,1.8288192749023438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,8,1,power_law_1.01,1.9097024917602539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,8,1,power_law_1.2,1.946054458618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,2688,1856,6,128,8,1,power_law_1.2,1.9481088638305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,1,balanced,0.9636853535970052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,1,balanced,0.9795626799265543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,1,power_law_1.01,1.1215871810913085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,1,power_law_1.01,1.1231167793273926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,1,power_law_1.2,1.1644351959228516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,1,power_law_1.2,1.1655232429504394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,128,balanced,0.32654400666554767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,128,balanced,0.32842133442560834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,128,power_law_1.01,0.3414975881576538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,128,power_law_1.01,0.34330239295959475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,128,power_law_1.2,0.35145599842071534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,128,power_law_1.2,0.35326080322265624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,16,balanced,0.36801600456237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,16,balanced,0.3681013186772664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,16,power_law_1.01,0.3955071926116943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,16,power_law_1.01,0.40062718391418456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,16,power_law_1.2,0.4028800010681152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,16,power_law_1.2,0.4066688060760498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,2,balanced,0.6703200340270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,2,balanced,0.6717867056528727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,2,power_law_1.01,0.7546175956726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,2,power_law_1.01,0.768620777130127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,2,power_law_1.2,0.799513578414917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,2,power_law_1.2,0.7995520114898682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,256,balanced,0.326474666595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,256,balanced,0.32655467589696247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,256,power_law_1.01,0.3337599992752075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,256,power_law_1.01,0.33524479866027834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,256,power_law_1.2,0.34283521175384524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,256,power_law_1.2,0.3440959930419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,32,balanced,0.3442879915237427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,32,balanced,0.3444586594899495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,32,power_law_1.01,0.36462080478668213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,32,power_law_1.01,0.3646399974822998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,32,power_law_1.2,0.37141759395599366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,32,power_law_1.2,0.37355520725250246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,4,balanced,0.5046559969584147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,4,balanced,0.5062133471171061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,4,power_law_1.01,0.5524799823760986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,4,power_law_1.01,0.5630464076995849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,4,power_law_1.2,0.5864575862884521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,4,power_law_1.2,0.5884799957275391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,64,balanced,0.3317280014355977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,64,balanced,0.3335413138071696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,64,power_law_1.01,0.3476351976394653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,64,power_law_1.01,0.35061120986938477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,64,power_law_1.2,0.3589695930480957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,64,power_law_1.2,0.3595328092575073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,8,balanced,0.41465067863464355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,8,balanced,0.4147466818491618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,8,power_law_1.01,0.45421438217163085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,8,power_law_1.01,0.45664639472961427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,8,power_law_1.2,0.4709311962127686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,1,8,power_law_1.2,0.4729472160339355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,16,1,balanced,0.29371732473373413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,16,1,power_law_1.01,0.3330496072769165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,16,1,power_law_1.01,0.3332992076873779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,16,1,power_law_1.2,0.3383552074432373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,16,1,power_law_1.2,0.34000000953674314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,2,1,balanced,0.5980746746063232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,2,1,balanced,0.5983359813690186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,2,1,power_law_1.01,0.6871679782867431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,2,1,power_law_1.01,0.6942272186279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,2,1,power_law_1.2,0.7184063911437988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,2,1,power_law_1.2,0.7208896160125733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,32,1,balanced,0.2700693408648173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,32,1,balanced,0.27249600489934284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,32,1,power_law_1.01,0.3120448112487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,32,1,power_law_1.01,0.3123456001281738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,32,1,power_law_1.2,0.3168895959854126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,32,1,power_law_1.2,0.318886399269104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,4,1,balanced,0.41788268089294434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,4,1,balanced,0.41897066434224445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,4,1,power_law_1.01,0.4696000099182129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,4,1,power_law_1.01,0.47642879486083983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,4,1,power_law_1.2,0.48491520881652833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,4,1,power_law_1.2,0.4890751838684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,8,1,balanced,0.3370240132013957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,8,1,balanced,0.33880531787872314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,8,1,power_law_1.01,0.3800895929336548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,8,1,power_law_1.01,0.3804800033569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,8,1,power_law_1.2,0.3907263994216919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,3072,1536,8,256,8,1,power_law_1.2,0.3917695999145508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,1,balanced,1.4474986394246419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,1,balanced,1.4543360074361165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,1,power_law_1.01,1.483334445953369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,1,power_law_1.01,1.5042943954467773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,1,power_law_1.2,1.5159168243408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,1,power_law_1.2,1.5211968421936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,2,balanced,0.921994686126709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,2,balanced,0.9256213506062826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,2,power_law_1.01,1.103052806854248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,2,power_law_1.01,1.1072896003723145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,2,power_law_1.2,1.0811264038085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,2,power_law_1.2,1.1584063529968263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,4,balanced,0.6720373630523682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,4,balanced,0.6790719827016195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,4,power_law_1.01,0.9700223922729492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,4,power_law_1.01,0.9889151573181152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,4,power_law_1.2,0.8894911766052246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,4,power_law_1.2,1.0910847663879395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,8,balanced,0.5378773212432861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,8,balanced,0.5385813315709432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,8,power_law_1.01,0.8546303749084473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,8,power_law_1.01,0.8695872306823731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,8,power_law_1.2,0.8464384078979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,1,8,power_law_1.2,0.8542847633361816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,16,1,balanced,0.18120000759760538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,16,1,balanced,0.18122132619222006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,16,1,power_law_1.01,0.18261120319366456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,16,1,power_law_1.01,0.18301440477371217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,16,1,power_law_1.2,0.18122880458831786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,16,1,power_law_1.2,0.1823807954788208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,2,1,balanced,0.7622293631235758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,2,1,balanced,0.7639146645863851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,2,1,power_law_1.01,0.7850048065185546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,2,1,power_law_1.01,0.797811222076416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,2,1,power_law_1.2,0.7768320083618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,2,1,power_law_1.2,0.7838912010192871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,32,1,balanced,0.14591999848683676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,32,1,balanced,0.14711466431617737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,32,1,power_law_1.01,0.14736640453338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,32,1,power_law_1.01,0.14748799800872803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,32,1,power_law_1.2,0.14677759408950805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,32,1,power_law_1.2,0.14967679977416992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,4,1,balanced,0.4166773160298665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,4,1,balanced,0.4268960158030192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,4,1,power_law_1.01,0.4218624114990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,4,1,power_law_1.01,0.42495360374450686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,4,1,power_law_1.2,0.4227456092834473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,4,1,power_law_1.2,0.4320511817932129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,8,1,balanced,0.251525342464447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,8,1,balanced,0.2552853425343831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,8,1,power_law_1.01,0.2576575994491577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,8,1,power_law_1.01,0.2644736051559448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,8,1,power_law_1.2,0.259935998916626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,14336,2,8,8,1,power_law_1.2,0.2623039960861206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,1,balanced,1.003002643585205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,1,balanced,1.0128586292266846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,1,power_law_1.01,1.065939235687256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,1,power_law_1.01,1.0744640350341796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,1,power_law_1.2,1.0828288078308106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,1,power_law_1.2,1.0904128074645996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,128,balanced,0.33879466851552326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,128,balanced,0.3389600118001302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,128,power_law_1.01,0.36341118812561035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,128,power_law_1.01,0.3646656036376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,128,power_law_1.2,0.37832961082458494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,128,power_law_1.2,0.39001600742340087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,16,balanced,0.38038400808970135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,16,balanced,0.3805653254191081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,16,power_law_1.01,0.40787839889526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,16,power_law_1.01,0.4133632183074951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,16,power_law_1.2,0.43476481437683107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,16,power_law_1.2,0.4416192054748535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,2,balanced,0.6986560026804606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,2,balanced,0.6996373335520426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,2,power_law_1.01,0.7626239776611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,2,power_law_1.01,0.7783936023712158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,2,power_law_1.2,0.7576831817626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,2,power_law_1.2,0.7885951995849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,32,balanced,0.35549334685007733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,32,balanced,0.35681601365407306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,32,power_law_1.01,0.39253759384155273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,32,power_law_1.01,0.39653759002685546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,32,power_law_1.2,0.3968127965927124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,32,power_law_1.2,0.4108287811279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,4,balanced,0.5205493370691935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,4,balanced,0.5209920008977255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,4,power_law_1.01,0.5527103900909424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,4,power_law_1.01,0.5646143913269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,4,power_law_1.2,0.593017578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,4,power_law_1.2,0.6089920043945313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,64,balanced,0.34303466478983563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,64,balanced,0.34386666615804035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,64,power_law_1.01,0.37097599506378176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,64,power_law_1.01,0.3743488073348999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,64,power_law_1.2,0.3857599973678589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,64,power_law_1.2,0.39152638912200927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,8,balanced,0.42685866355895996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,8,balanced,0.428111990292867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,8,power_law_1.01,0.4637440204620361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,8,power_law_1.01,0.4733248233795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,8,power_law_1.2,0.47630720138549804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,1,8,power_law_1.2,0.48787198066711424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,16,1,balanced,0.3331786592801412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,16,1,balanced,0.3343413273493449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,16,1,power_law_1.01,0.34437758922576905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,16,1,power_law_1.01,0.34565761089324953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,16,1,power_law_1.2,0.3460864067077637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,16,1,power_law_1.2,0.34736640453338624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,2,1,balanced,0.6456106503804525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,2,1,balanced,0.6485439936319987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,2,1,power_law_1.01,0.6737599849700928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,2,1,power_law_1.01,0.6808703899383545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,2,1,power_law_1.2,0.6866559982299805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,2,1,power_law_1.2,0.6869440078735352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,32,1,balanced,0.3102453351020813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,32,1,balanced,0.31056533257166546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,32,1,power_law_1.01,0.31988480091094973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,32,1,power_law_1.01,0.3208064079284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,32,1,power_law_1.2,0.32222719192504884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,32,1,power_law_1.2,0.32264959812164307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,4,1,balanced,0.4601279894510905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,4,1,balanced,0.46085866292317706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,4,1,power_law_1.01,0.47318401336669924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,4,1,power_law_1.01,0.47630720138549804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,4,1,power_law_1.2,0.4789567947387695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,4,1,power_law_1.2,0.4799808025360107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,8,1,balanced,0.37823466459910077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,8,1,balanced,0.37832534313201904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,8,1,power_law_1.01,0.3877120018005371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,8,1,power_law_1.01,0.39010560512542725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,8,1,power_law_1.2,0.3936448097229004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,1536,8,128,8,1,power_law_1.2,0.3940608024597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,1,balanced,6.282485326131185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,1,balanced,6.339829126993815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,1,power_law_1.01,5.759500885009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,1,power_law_1.01,5.893657684326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,1,power_law_1.2,5.915641784667969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,1,power_law_1.2,6.068928146362305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,128,balanced,1.2148586908976238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,128,balanced,1.2148799896240234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,128,power_law_1.01,1.2492223739624024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,128,power_law_1.01,1.2547007560729981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,128,power_law_1.2,1.2728384017944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,128,power_law_1.2,1.2777471542358398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,16,balanced,1.4768800735473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,16,balanced,1.4825280507405598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,16,power_law_1.01,1.4974016189575194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,16,power_law_1.01,1.5137151718139648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,16,power_law_1.2,1.5444479942321778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,16,power_law_1.2,1.55796480178833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,2,balanced,3.5783678690592446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,2,balanced,3.680239995320638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,2,power_law_1.01,3.4459903717041014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,2,power_law_1.01,3.4563518524169923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,2,power_law_1.2,3.496473693847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,2,power_law_1.2,3.545171356201172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,256,balanced,1.1950613657633464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,256,balanced,1.1953333218892415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,256,power_law_1.01,1.2222847938537598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,256,power_law_1.01,1.2317184448242187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,256,power_law_1.2,1.2412544250488282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,256,power_law_1.2,1.266214370727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,32,balanced,1.3295040130615234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,32,balanced,1.3347892761230469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,32,power_law_1.01,1.3681407928466798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,32,power_law_1.01,1.375667190551758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,32,power_law_1.2,1.3940671920776366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,32,power_law_1.2,1.4113344192504882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,4,balanced,2.3388214111328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,4,balanced,2.3533493677775064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,4,power_law_1.01,2.3303232192993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,4,power_law_1.01,2.3614015579223633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,4,power_law_1.2,2.3995328903198243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,4,power_law_1.2,2.41092472076416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,64,balanced,1.2526986598968506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,64,balanced,1.2530506451924641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,64,power_law_1.01,1.290982437133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,64,power_law_1.01,1.2995264053344726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,64,power_law_1.2,1.3211775779724122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,64,power_law_1.2,1.3402815818786622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,8,balanced,1.7720266977945964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,8,balanced,1.7743786176045735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,8,power_law_1.01,1.8141056060791017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,8,power_law_1.01,1.815488052368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,8,power_law_1.2,1.8518848419189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,1,8,power_law_1.2,1.8700223922729493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,16,1,balanced,10.780170440673828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,16,1,balanced,11.035082499186197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,16,1,power_law_1.01,10.093836975097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,16,1,power_law_1.01,10.133299255371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,16,1,power_law_1.2,10.448627471923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,16,1,power_law_1.2,10.54358367919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,2,1,balanced,3.514394760131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,2,1,balanced,3.648144086201986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,2,1,power_law_1.01,3.094483184814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,2,1,power_law_1.01,3.1589824676513674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,2,1,power_law_1.2,3.228441619873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,2,1,power_law_1.2,3.2590206146240233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,32,1,balanced,7.89459228515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,32,1,balanced,7.955312093098958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,32,1,power_law_1.01,7.003212738037109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,32,1,power_law_1.01,7.089849853515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,32,1,power_law_1.2,7.211238098144531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,32,1,power_law_1.2,7.256889343261719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,4,1,balanced,2.135711987813314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,4,1,balanced,2.14520533879598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,4,1,power_law_1.01,1.9685888290405273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,4,1,power_law_1.01,1.988684844970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,4,1,power_law_1.2,2.0077184677124023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,4,1,power_law_1.2,2.0161663055419923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,8,1,balanced,1.4905440012613933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,8,1,balanced,1.4947840372721355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,8,1,power_law_1.01,1.3745216369628905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,8,1,power_law_1.01,1.3811264038085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,8,1,power_law_1.2,1.4080063819885253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,4096,2688,22,512,8,1,power_law_1.2,1.408902359008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,1,balanced,2.3127573331197104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,1,balanced,2.3180267016092935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,1,power_law_1.01,2.363462448120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,1,power_law_1.01,2.407980728149414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,1,power_law_1.2,2.353753662109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,1,power_law_1.2,2.392793655395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,2,balanced,1.3333919843037922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,2,balanced,1.357632001241048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,2,power_law_1.01,1.72412166595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,2,power_law_1.01,1.7670528411865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,2,power_law_1.2,1.6049856185913085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,2,power_law_1.2,1.697804832458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,4,balanced,0.854581356048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,4,balanced,0.8673386573791504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,4,power_law_1.01,1.3901823997497558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,4,power_law_1.01,1.4267711639404297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,4,power_law_1.2,1.4132096290588378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,4,power_law_1.2,1.4463295936584473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,8,balanced,0.6607626676559448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,8,balanced,0.6642080148061117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,8,power_law_1.01,1.133683204650879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,8,power_law_1.01,1.2866623878479004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,8,power_law_1.2,1.2250304222106934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,1,8,power_law_1.2,1.2898176193237305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,16,1,balanced,0.25062400102615356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,16,1,balanced,0.25165865818659466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,16,1,power_law_1.01,0.257804799079895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,16,1,power_law_1.01,0.260646390914917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,16,1,power_law_1.2,0.25546879768371583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,16,1,power_law_1.2,0.2599679946899414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,2,1,balanced,1.133845329284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,2,1,balanced,1.1503146489461262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,2,1,power_law_1.01,1.2253120422363282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,2,1,power_law_1.01,1.2470720291137696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,2,1,power_law_1.2,1.2301631927490235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,2,1,power_law_1.2,1.2456512451171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,32,1,balanced,0.19350399573644003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,32,1,balanced,0.19629865884780884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,32,1,power_law_1.01,0.19952640533447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,32,1,power_law_1.01,0.201094388961792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,32,1,power_law_1.2,0.19994879961013795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,32,1,power_law_1.2,0.20195839405059815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,4,1,balanced,0.625930666923523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,4,1,balanced,0.6362400054931641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,4,1,power_law_1.01,0.663424015045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,4,1,power_law_1.01,0.6721343994140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,4,1,power_law_1.2,0.6571584224700928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,4,1,power_law_1.2,0.674892807006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,8,1,balanced,0.37854933738708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,8,1,balanced,0.3838133414586385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,8,1,power_law_1.01,0.3867583990097046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,8,1,power_law_1.01,0.39613440036773684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,8,1,power_law_1.2,0.3874943971633911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,16384,2,8,8,1,power_law_1.2,0.39045760631561277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,1,balanced,2.1928000450134277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,1,balanced,2.2919467290242515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,1,power_law_1.01,2.6940544128417967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,1,power_law_1.01,2.700601577758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,1,power_law_1.2,2.8483327865600585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,1,power_law_1.2,2.8565887451171874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,128,balanced,0.5130399862925211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,128,balanced,0.5145119825998942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,128,power_law_1.01,0.5422336101531983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,128,power_law_1.01,0.5462399959564209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,128,power_law_1.2,0.5721792221069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,128,power_law_1.2,0.5721920013427735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,16,balanced,0.6144426663716634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,16,balanced,0.6171199878056844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,16,power_law_1.01,0.6804160118103028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,16,power_law_1.01,0.6936448097229004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,16,power_law_1.2,0.6975808143615723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,16,power_law_1.2,0.7194496154785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,2,balanced,1.4004747072855632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,2,balanced,1.4038987159729004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,2,power_law_1.01,1.6360383987426759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,2,power_law_1.01,1.64019832611084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,2,power_law_1.2,1.6929407119750977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,2,power_law_1.2,1.7145280838012695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,256,balanced,0.5082346598307291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,256,balanced,0.5105706850687662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,256,power_law_1.01,0.5340479850769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,256,power_law_1.01,0.5362175941467285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,256,power_law_1.2,0.5537407875061036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,256,power_law_1.2,0.5539455890655518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,32,balanced,0.555242657661438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,32,balanced,0.5565439860026041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,32,power_law_1.01,0.6085247993469238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,32,power_law_1.01,0.6096704006195068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,32,power_law_1.2,0.6246592044830322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,32,power_law_1.2,0.6447296142578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,4,balanced,0.9545866648356119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,4,balanced,0.9596319993336996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,4,power_law_1.01,1.1023103713989257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,4,power_law_1.01,1.1417344093322754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,4,power_law_1.2,1.1339008331298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,4,power_law_1.2,1.1387455940246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,64,balanced,0.5253973404566447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,64,balanced,0.5283786853154501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,64,power_law_1.01,0.5661632061004639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,64,power_law_1.01,0.5703487873077393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,64,power_law_1.2,0.5892159938812256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,64,power_law_1.2,0.5930560111999512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,8,balanced,0.7251839637756348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,8,balanced,0.7310026486714681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,8,power_law_1.01,0.8091903686523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,8,power_law_1.01,0.836518383026123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,8,power_law_1.2,0.8428671836853028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,1,8,power_law_1.2,0.8766783714294434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,16,1,balanced,0.5171573162078857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,16,1,balanced,0.5178133249282837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,16,1,power_law_1.01,0.5923264026641846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,16,1,power_law_1.01,0.5962495803833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,16,1,power_law_1.2,0.6050559997558593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,16,1,power_law_1.2,0.6070400238037109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,2,1,balanced,1.2849546273549397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,2,1,balanced,1.2937653064727783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,2,1,power_law_1.01,1.5092608451843261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,2,1,power_law_1.01,1.5178048133850097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,2,1,power_law_1.2,1.5579456329345702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,2,1,power_law_1.2,1.563321590423584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,32,1,balanced,0.4715893268585205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,32,1,balanced,0.47381333510080975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,32,1,power_law_1.01,0.5503615856170654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,32,1,power_law_1.01,0.5516672134399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,32,1,power_law_1.2,0.5601600170135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,32,1,power_law_1.2,0.562227201461792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,4,1,balanced,0.8270400365193685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,4,1,balanced,0.8285866578420004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,4,1,power_law_1.01,0.9754303932189942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,4,1,power_law_1.01,0.9795519828796386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,4,1,power_law_1.2,1.001798439025879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,4,1,power_law_1.2,1.0075391769409179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,8,1,balanced,0.6270933151245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,8,1,balanced,0.629045327504476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,8,1,power_law_1.01,0.7208000183105469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,8,1,power_law_1.01,0.7241536140441894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,8,1,power_law_1.2,0.7404736042022705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2048,8,256,8,1,power_law_1.2,0.7414720058441162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,1,balanced,2.805295944213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,1,balanced,2.8691466649373374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,1,power_law_1.01,2.5403072357177736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,1,power_law_1.01,2.5464960098266602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,1,power_law_1.2,2.6096319198608398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,1,power_law_1.2,2.637785530090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,16,balanced,0.645466685295105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,16,balanced,0.6474560101826986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,16,power_law_1.01,0.69966721534729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,16,power_law_1.01,0.7165696144104003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,16,power_law_1.2,0.7298367977142334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,16,power_law_1.2,0.7358975887298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,2,balanced,1.5990667343139648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,2,balanced,1.6120853424072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,2,power_law_1.01,1.6397504806518555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,2,power_law_1.01,1.6955583572387696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,2,power_law_1.2,1.6321599960327149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,2,power_law_1.2,1.683795166015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,32,balanced,0.5742239952087402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,32,balanced,0.57423468430837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,32,power_law_1.01,0.6280447959899902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,32,power_law_1.01,0.6400063991546631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,32,power_law_1.2,0.6576704025268555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,32,power_law_1.2,0.6764480113983155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,4,balanced,1.0530026753743489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,4,balanced,1.0580906867980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,4,power_law_1.01,1.1029824256896972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,4,power_law_1.01,1.1055551528930665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,4,power_law_1.2,1.0785087585449218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,4,power_law_1.2,1.1590527534484862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,8,balanced,0.781173308690389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,8,balanced,0.7826399803161621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,8,power_law_1.01,0.8297599792480469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,8,power_law_1.01,0.8359744071960449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,8,power_law_1.2,0.8741120338439942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,1,8,power_law_1.2,0.9200384140014648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,16,1,balanced,0.5929760138193766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,16,1,balanced,0.5934666792551676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,16,1,power_law_1.01,0.5818880081176758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,16,1,power_law_1.01,0.5840640068054199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,16,1,power_law_1.2,0.5857471942901611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,16,1,power_law_1.2,0.5898047924041748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,2,1,balanced,1.508314609527588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,2,1,balanced,1.510874589284261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,2,1,power_law_1.01,1.4573760032653809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,2,1,power_law_1.01,1.4713472366333007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,2,1,power_law_1.2,1.4986751556396485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,2,1,power_law_1.2,1.5044416427612304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,32,1,balanced,0.5288213491439819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,32,1,balanced,0.529210646947225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,32,1,power_law_1.01,0.5196800231933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,32,1,power_law_1.01,0.5214655876159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,32,1,power_law_1.2,0.5268735885620117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,32,1,power_law_1.2,0.5271552085876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,4,1,balanced,0.9501919746398926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,4,1,balanced,0.9543039798736572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,4,1,power_law_1.01,0.939078426361084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,4,1,power_law_1.01,0.9400383949279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,4,1,power_law_1.2,0.9462719917297363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,4,1,power_law_1.2,0.9494463920593261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,8,1,balanced,0.6921706994374593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,8,1,balanced,0.6926506360371908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,8,1,power_law_1.01,0.681606388092041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,8,1,power_law_1.01,0.6846784114837646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,8,1,power_law_1.2,0.688921594619751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,6144,2560,8,160,8,1,power_law_1.2,0.6903488159179687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,1,balanced,2.6646453539530435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,1,balanced,2.726223945617676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,1,power_law_1.01,3.1161855697631835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,1,power_law_1.01,3.1951936721801757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,1,power_law_1.2,3.237459182739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,1,power_law_1.2,3.3228992462158202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,128,balanced,0.5609920024871826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,128,balanced,0.5634719928105673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,128,power_law_1.01,0.5930431842803955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,128,power_law_1.01,0.5938111782073975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,128,power_law_1.2,0.6160895824432373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,128,power_law_1.2,0.6190976142883301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,16,balanced,0.6820533275604248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,16,balanced,0.6824053128560384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,16,power_law_1.01,0.7587584018707275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,16,power_law_1.01,0.770195198059082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,16,power_law_1.2,0.8033920288085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,16,power_law_1.2,0.8222911834716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,2,balanced,1.5984959602355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,2,balanced,1.6271947224934895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,2,power_law_1.01,1.8576576232910156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,2,power_law_1.01,1.8616704940795898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,2,power_law_1.2,1.925811195373535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,2,power_law_1.2,1.9264640808105469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,256,balanced,0.5558773279190063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,256,balanced,0.5575999816258749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,256,power_law_1.01,0.5815999984741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,256,power_law_1.01,0.5852223873138428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,256,power_law_1.2,0.6036992073059082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,256,power_law_1.2,0.6115327835083008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,32,balanced,0.6103786627451578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,32,balanced,0.6112320025761923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,32,power_law_1.01,0.666323184967041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,32,power_law_1.01,0.67674880027771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,32,power_law_1.2,0.6971776008605957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,32,power_law_1.2,0.7228608131408691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,4,balanced,1.0748266379038494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,4,balanced,1.0763946374257405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,4,power_law_1.01,1.2548288345336913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,4,power_law_1.01,1.2684351921081543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,4,power_law_1.2,1.273158359527588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,4,power_law_1.2,1.294604778289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,64,balanced,0.5739519993464152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,64,balanced,0.5762293338775635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,64,power_law_1.01,0.6225088119506836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,64,power_law_1.01,0.6307136058807373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,64,power_law_1.2,0.635430383682251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,64,power_law_1.2,0.638969612121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,8,balanced,0.8113226890563965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,8,balanced,0.8141866525014242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,8,power_law_1.01,0.9141311645507812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,8,power_law_1.01,0.9364543914794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,8,power_law_1.2,0.9713088035583496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,1,8,power_law_1.2,0.9747008323669434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,16,1,balanced,0.5899626811345419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,16,1,balanced,0.5903840065002441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,16,1,power_law_1.01,0.6797887802124023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,16,1,power_law_1.01,0.6813119888305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,16,1,power_law_1.2,0.6900288105010987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,16,1,power_law_1.2,0.6950719833374024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,2,1,balanced,1.485978603363037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,2,1,balanced,1.4912746747334797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,2,1,power_law_1.01,1.7315071105957032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,2,1,power_law_1.01,1.7493888854980468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,2,1,power_law_1.2,1.8010623931884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,2,1,power_law_1.2,1.8023103713989257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,32,1,balanced,0.5380213260650635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,32,1,balanced,0.5387093226114908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,32,1,power_law_1.01,0.630457592010498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,32,1,power_law_1.01,0.6315839767456055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,32,1,power_law_1.2,0.6434175968170166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,32,1,power_law_1.2,0.6470272064208984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,4,1,balanced,0.9478773276011149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,4,1,balanced,0.9499680201212565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,4,1,power_law_1.01,1.1266112327575684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,4,1,power_law_1.01,1.1270784378051757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,4,1,power_law_1.2,1.150163173675537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,4,1,power_law_1.2,1.157478427886963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,8,1,balanced,0.7186079819997152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,8,1,balanced,0.7186453342437744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,8,1,power_law_1.01,0.824185562133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,8,1,power_law_1.01,0.8312000274658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,8,1,power_law_1.2,0.8486720085144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,256,8,1,power_law_1.2,0.8516287803649902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,1,balanced,3.8292318979899087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,1,balanced,3.8525546391805015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,1,power_law_1.01,4.039334487915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,1,power_law_1.01,4.193427276611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,1,power_law_1.2,4.155219268798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,1,power_law_1.2,4.224646377563476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,128,balanced,0.6248053312301636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,128,balanced,0.6255253156026205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,128,power_law_1.01,0.6570943832397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,128,power_law_1.01,0.6585855960845948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,128,power_law_1.2,0.6784319877624512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,128,power_law_1.2,0.6806719779968262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,16,balanced,0.8002879619598389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,16,balanced,0.8017439842224121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,16,power_law_1.01,0.8553600311279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,16,power_law_1.01,0.8722944259643555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,16,power_law_1.2,0.8943552017211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,16,power_law_1.2,0.8987135887145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,2,balanced,2.204784075419108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,2,balanced,2.2099040349324546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,2,power_law_1.01,2.2681983947753905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,2,power_law_1.01,2.33492488861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,2,power_law_1.2,2.3621440887451173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,2,power_law_1.2,2.369094467163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,32,balanced,0.7016106446584066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,32,balanced,0.7017920017242432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,32,power_law_1.01,0.7408383846282959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,32,power_law_1.01,0.7493375778198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,32,power_law_1.2,0.7667520046234131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,32,power_law_1.2,0.7672704219818115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,4,balanced,1.3708426157633464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,4,balanced,1.37227201461792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,4,power_law_1.01,1.4700991630554199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,4,power_law_1.01,1.4735424041748046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,4,power_law_1.2,1.523475170135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,4,power_law_1.2,1.5438655853271483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,64,balanced,0.6491733392079672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,64,balanced,0.6499306758244833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,64,power_law_1.01,0.6880576133728027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,64,power_law_1.01,0.6976511955261231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,64,power_law_1.2,0.7016767978668212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,64,power_law_1.2,0.7025152206420898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,8,balanced,0.9957119623819987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,8,balanced,0.9978559811909994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,8,power_law_1.01,1.0614399909973145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,8,power_law_1.01,1.0681856155395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,8,power_law_1.2,1.089145565032959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,1,8,power_law_1.2,1.125984001159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,16,1,balanced,0.7546613216400146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,16,1,balanced,0.7566506862640381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,16,1,power_law_1.01,0.8050687789916993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,16,1,power_law_1.01,0.8110336303710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,16,1,power_law_1.2,0.8333760261535644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,16,1,power_law_1.2,0.8402239799499511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,2,1,balanced,2.0163787206014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,2,1,balanced,2.073578675587972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,2,1,power_law_1.01,2.152672004699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,2,1,power_law_1.01,2.1843584060668944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,2,1,power_law_1.2,2.2634111404418946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,2,1,power_law_1.2,2.2757503509521486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,32,1,balanced,0.6929173469543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,32,1,balanced,0.6955733299255371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,32,1,power_law_1.01,0.7225152015686035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,32,1,power_law_1.01,0.7285823822021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,32,1,power_law_1.2,0.745088005065918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,32,1,power_law_1.2,0.7487808227539062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,4,1,balanced,1.2790239651997883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,4,1,balanced,1.2821119626363118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,4,1,power_law_1.01,1.3532032012939452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,4,1,power_law_1.01,1.361734390258789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,4,1,power_law_1.2,1.4179200172424316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,4,1,power_law_1.2,1.4229887962341308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,8,1,balanced,0.9370933373769125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,8,1,balanced,0.9398667017618815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,8,1,power_law_1.01,0.984108829498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,8,1,power_law_1.01,0.9888704299926758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,8,1,power_law_1.2,1.0203968048095704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,3072,7168,2048,8,384,8,1,power_law_1.2,1.0232959747314454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,1,balanced,0.13378666838010153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,1,balanced,0.1343786617120107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,1,power_law_1.01,0.11307519674301147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,1,power_law_1.01,0.11580159664154052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,1,power_law_1.2,0.11696640253067017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,1,power_law_1.2,0.11737600564956666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,128,balanced,0.029338667790095013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,128,balanced,0.0315733328461647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,128,power_law_1.01,0.028960001468658448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,128,power_law_1.01,0.03020159900188446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,128,power_law_1.2,0.02895359992980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,128,power_law_1.2,0.02919679880142212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,16,balanced,0.035232000052928925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,16,balanced,0.03548266738653183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,16,power_law_1.01,0.03317759931087494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,16,power_law_1.01,0.033228799700737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,16,power_law_1.2,0.03240959942340851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,16,power_law_1.2,0.033164799213409424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,2,balanced,0.0888266662756602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,2,balanced,0.09091732899347942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,2,power_law_1.01,0.08242560029029847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,2,power_law_1.01,0.08518400192260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,2,power_law_1.2,0.08325759768486023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,2,power_law_1.2,0.08430079817771911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,32,balanced,0.03142400085926056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,32,balanced,0.03215466688076655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,32,power_law_1.01,0.02993920147418976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,32,power_law_1.01,0.030700799822807313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,32,power_law_1.2,0.030393600463867188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,32,power_law_1.2,0.030752000212669373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,4,balanced,0.05938133100668589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,4,balanced,0.06018666426340739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,4,power_law_1.01,0.05423359870910645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,4,power_law_1.01,0.05488640069961548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,4,power_law_1.2,0.0543936014175415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,4,power_law_1.2,0.055692797899246214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,64,balanced,0.031504000226656594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,64,balanced,0.03166399896144867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,64,power_law_1.01,0.02906239926815033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,64,power_law_1.01,0.02990719974040985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,64,power_law_1.2,0.02963840067386627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,64,power_law_1.2,0.029811200499534608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,8,balanced,0.04172799984614054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,8,balanced,0.041749333341916404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,8,power_law_1.01,0.03759360015392303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,8,power_law_1.01,0.03925119936466217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,8,power_law_1.2,0.03857280015945434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,1,8,power_law_1.2,0.039776000380516055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,2,1,balanced,0.08902933200200398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,2,1,balanced,0.09093333284060161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,2,1,power_law_1.01,0.08188160061836243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,2,1,power_law_1.01,0.08384000062942505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,2,1,power_law_1.2,0.08142719864845276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,2,1,power_law_1.2,0.08260480165481568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,4,1,balanced,0.06257600088914235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,4,1,balanced,0.06354666749636333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,4,1,power_law_1.01,0.05685120224952698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,4,1,power_law_1.01,0.057792001962661745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,4,1,power_law_1.2,0.05583360195159912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2048,768,8,128,4,1,power_law_1.2,0.0574400007724762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,1,balanced,0.3275573253631592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,1,balanced,0.3280693292617798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,1,power_law_1.01,0.2587712049484253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,1,power_law_1.01,0.260646390914917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,1,power_law_1.2,0.2552000045776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,1,power_law_1.2,0.26190719604492185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,128,balanced,0.033615998923778534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,128,balanced,0.03532800078392029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,128,power_law_1.01,0.033657601475715636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,128,power_law_1.01,0.03369599878787995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,128,power_law_1.2,0.03344640135765076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,128,power_law_1.2,0.03451519906520843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,16,balanced,0.055386667450269066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,16,balanced,0.05611733098824819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,16,power_law_1.01,0.05047680139541626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,16,power_law_1.01,0.0537280023097992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,16,power_law_1.2,0.05082880258560181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,16,power_law_1.2,0.052691197395324706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,2,balanced,0.1855306625366211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,2,balanced,0.1865653395652771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,2,power_law_1.01,0.1562432050704956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,2,power_law_1.01,0.1568063974380493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,2,power_law_1.2,0.147052800655365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,2,power_law_1.2,0.1568063974380493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,32,balanced,0.039808000127474465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,32,balanced,0.03982399900754293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,32,power_law_1.01,0.03877759873867035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,32,power_law_1.01,0.03893119990825653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,32,power_law_1.2,0.03858560025691986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,32,power_law_1.2,0.038700801134109494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,4,balanced,0.1160533328851064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,4,balanced,0.11685333649317424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,4,power_law_1.01,0.10566400289535523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,4,power_law_1.01,0.10614399909973145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,4,power_law_1.2,0.10026240348815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,4,power_law_1.2,0.10552959442138672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,64,balanced,0.03766400118668874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,64,balanced,0.03789866715669632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,64,power_law_1.01,0.03589119911193848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,64,power_law_1.01,0.036032000184059144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,64,power_law_1.2,0.0364544004201889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,64,power_law_1.2,0.036883199214935304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,8,balanced,0.07745600243409474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,8,balanced,0.07842666904131572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,8,power_law_1.01,0.06984959840774536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,8,power_law_1.01,0.070796799659729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,8,power_law_1.2,0.06752640008926392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,1,8,power_law_1.2,0.07255039811134338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,16,1,balanced,0.21386667092641196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,16,1,balanced,0.21602133909861246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,16,1,power_law_1.01,0.16346240043640137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,16,1,power_law_1.01,0.1655743956565857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,16,1,power_law_1.2,0.16293120384216309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,16,1,power_law_1.2,0.16965759992599488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,2,1,balanced,0.1874826749165853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,2,1,balanced,0.18950400749842325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,2,1,power_law_1.01,0.15175679922103882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,2,1,power_law_1.01,0.15219839811325073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,2,1,power_law_1.2,0.14961279630661012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,2,1,power_law_1.2,0.1508095979690552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,32,1,balanced,0.1930933396021525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,32,1,balanced,0.19365866978963217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,32,1,power_law_1.01,0.1512063980102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,32,1,power_law_1.01,0.15419520139694215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,32,1,power_law_1.2,0.15061119794845582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,32,1,power_law_1.2,0.15086079835891725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,4,1,balanced,0.11931199828783672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,4,1,balanced,0.11984533071517944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,4,1,power_law_1.01,0.1028223991394043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,4,1,power_law_1.01,0.10401920080184937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,4,1,power_law_1.2,0.1003648042678833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,4,1,power_law_1.2,0.10146559476852417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,8,1,balanced,0.2574453353881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,8,1,balanced,0.25755200783411664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,8,1,power_law_1.01,0.20391039848327636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,8,1,power_law_1.01,0.20519680976867677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,8,1,power_law_1.2,0.19667199850082398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,2688,1856,6,128,8,1,power_law_1.2,0.2036736011505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,1,balanced,0.5764906803766886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,1,balanced,0.6605066855748495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,1,power_law_1.01,0.3120575904846191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,1,power_law_1.01,0.3176383972167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,1,power_law_1.2,0.28949120044708254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,1,power_law_1.2,0.29114880561828616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,128,balanced,0.037477334340413414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,128,balanced,0.037674665451049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,128,power_law_1.01,0.03641600012779236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,128,power_law_1.01,0.036857599020004274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,128,power_law_1.2,0.03670400083065033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,128,power_law_1.2,0.037401598691940305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,16,balanced,0.07474133372306824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,16,balanced,0.07554133236408234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,16,power_law_1.01,0.058143997192382814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,16,power_law_1.01,0.06284800171852112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,16,power_law_1.2,0.06177279949188232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,16,power_law_1.2,0.062080001831054686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,2,balanced,0.31616000334421795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,2,balanced,0.3165760040283203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,2,power_law_1.01,0.19258240461349488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,2,power_law_1.01,0.19333759546279908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,2,power_law_1.2,0.17204480171203612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,2,power_law_1.2,0.18920960426330566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,256,balanced,0.036303999523321785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,256,balanced,0.037471999724706016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,256,power_law_1.01,0.03550719916820526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,256,power_law_1.01,0.03573760092258453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,256,power_law_1.2,0.03527039885520935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,256,power_law_1.2,0.03531520068645477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,32,balanced,0.055029332637786865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,32,balanced,0.056794668237368263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,32,power_law_1.01,0.05027840137481689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,32,power_law_1.01,0.05415679812431336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,32,power_law_1.2,0.04737280011177063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,32,power_law_1.2,0.05120000243186951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,4,balanced,0.18011732896169028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,4,balanced,0.18131200472513834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,4,power_law_1.01,0.11918720006942748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,4,power_law_1.01,0.1424831986427307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,4,power_law_1.2,0.1334272027015686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,4,power_law_1.2,0.1449087977409363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,64,balanced,0.04142933338880539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,64,balanced,0.041850666205088295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,64,power_law_1.01,0.04010879993438721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,64,power_law_1.01,0.04071039855480194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,64,power_law_1.2,0.03863039910793305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,64,power_law_1.2,0.040454399585723874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,8,balanced,0.1141919990380605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,8,balanced,0.11565333604812622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,8,power_law_1.01,0.10145280361175538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,8,power_law_1.01,0.10280959606170655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,8,power_law_1.2,0.08515200018882751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,1,8,power_law_1.2,0.10181119441986083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,16,1,balanced,0.09563733140627544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,16,1,balanced,0.09694400429725647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,16,1,power_law_1.01,0.06431360244750976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,16,1,power_law_1.01,0.06472960114479065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,16,1,power_law_1.2,0.06101120114326477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,16,1,power_law_1.2,0.06146559715270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,2,1,balanced,0.3137493332227071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,2,1,balanced,0.31387199958165485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,2,1,power_law_1.01,0.18109439611434935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,2,1,power_law_1.01,0.18307199478149414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,2,1,power_law_1.2,0.16743040084838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,2,1,power_law_1.2,0.1677567958831787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,32,1,balanced,0.08271466692288716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,32,1,balanced,0.08427199721336365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,32,1,power_law_1.01,0.0564736008644104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,32,1,power_law_1.01,0.05745279788970947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,32,1,power_law_1.2,0.05363199710845947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,32,1,power_law_1.2,0.05446400046348572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,4,1,balanced,0.19034665822982788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,4,1,balanced,0.1904053290685018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,4,1,power_law_1.01,0.11562880277633666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,4,1,power_law_1.01,0.11594239473342896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,4,1,power_law_1.2,0.11050239801406861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,4,1,power_law_1.2,0.11210240125656128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,8,1,balanced,0.132314662138621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,8,1,balanced,0.13294933239618936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,8,1,power_law_1.01,0.08499199748039246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,8,1,power_law_1.01,0.08562560081481933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,8,1,power_law_1.2,0.07864320278167725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,3072,1536,8,256,8,1,power_law_1.2,0.08064640164375306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,1,balanced,0.26769065856933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,1,balanced,0.2681013345718384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,1,power_law_1.01,0.2659712076187134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,1,power_law_1.01,0.27689599990844727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,1,power_law_1.2,0.27457919120788576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,1,power_law_1.2,0.2763776063919067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,2,balanced,0.17163733641306558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,2,balanced,0.17397334178288779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,2,power_law_1.01,0.16869759559631348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,2,power_law_1.01,0.17500799894332886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,2,power_law_1.2,0.1778175950050354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,2,power_law_1.2,0.17831039428710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,4,balanced,0.11372266213099162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,4,balanced,0.11772267023722331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,4,power_law_1.01,0.12580480575561523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,4,power_law_1.01,0.12943999767303466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,4,power_law_1.2,0.12165119647979736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,4,power_law_1.2,0.13336960077285767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,8,balanced,0.08954133590062459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,8,balanced,0.09097066521644592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,8,power_law_1.01,0.09797760248184204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,8,power_law_1.01,0.09990400075912476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,8,power_law_1.2,0.09262080192565918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,1,8,power_law_1.2,0.09939839839935302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,16,1,balanced,0.03759466608365377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,16,1,balanced,0.03951466580231985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,16,1,power_law_1.01,0.0383103996515274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,16,1,power_law_1.01,0.03948160111904144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,16,1,power_law_1.2,0.03893760144710541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,16,1,power_law_1.2,0.0406143993139267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,2,1,balanced,0.15677332878112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,2,1,balanced,0.1678239901860555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,2,1,power_law_1.01,0.1494271993637085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,2,1,power_law_1.01,0.15155199766159058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,2,1,power_law_1.2,0.15030399560928345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,2,1,power_law_1.2,0.15216000080108644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,32,1,balanced,0.03127466638882955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,32,1,balanced,0.031632001201311745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,32,1,power_law_1.01,0.02993279993534088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,32,1,power_law_1.01,0.03022719919681549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,32,1,power_law_1.2,0.030105599761009218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,32,1,power_law_1.2,0.030380800366401672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,4,1,balanced,0.08874666690826416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,4,1,balanced,0.08885866403579712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,4,1,power_law_1.01,0.09041280150413514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,4,1,power_law_1.01,0.09308159947395325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,4,1,power_law_1.2,0.08942720293998718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,4,1,power_law_1.2,0.09253759980201721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,8,1,balanced,0.05949333310127258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,8,1,balanced,0.06011199951171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,8,1,power_law_1.01,0.05668479800224304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,8,1,power_law_1.01,0.056704002618789676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,8,1,power_law_1.2,0.05569919943809509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,14336,2,8,8,1,power_law_1.2,0.05740159749984741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,1,balanced,0.4023946523666382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,1,balanced,0.4028533299763997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,1,power_law_1.01,0.34050559997558594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,1,power_law_1.01,0.34253439903259275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,1,power_law_1.2,0.3404223918914795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,1,power_law_1.2,0.3510591983795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,128,balanced,0.03758399933576584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,128,balanced,0.037589333951473236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,128,power_law_1.01,0.03570559918880463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,128,power_law_1.01,0.03606399893760681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,128,power_law_1.2,0.03583999872207642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,128,power_law_1.2,0.0361407995223999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,16,balanced,0.06214933097362518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,16,balanced,0.06293333570162456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,16,power_law_1.01,0.058841598033905027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,16,power_law_1.01,0.061427199840545656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,16,power_law_1.2,0.05600000023841858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,16,power_law_1.2,0.059539198875427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,2,balanced,0.2281066576639811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,2,balanced,0.23015999794006348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,2,power_law_1.01,0.19456640481948853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,2,power_law_1.01,0.20426878929138184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,2,power_law_1.2,0.19919359683990479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,2,power_law_1.2,0.20354559421539306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,32,balanced,0.04432533184687296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,32,balanced,0.045279999574025474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,32,power_law_1.01,0.043424001336097716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,32,power_law_1.01,0.043673598766326906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,32,power_law_1.2,0.04300160109996796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,32,power_law_1.2,0.04366720020771027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,4,balanced,0.14044800400733948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,4,balanced,0.14199466506640115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,4,power_law_1.01,0.13394559621810914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,4,power_law_1.01,0.13550080060958863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,4,power_law_1.2,0.13105920553207398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,4,power_law_1.2,0.13159680366516113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,64,balanced,0.0376800000667572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,64,balanced,0.037834666669368744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,64,power_law_1.01,0.03763200044631958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,64,power_law_1.01,0.03806720077991486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,64,power_law_1.2,0.03735679984092712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,64,power_law_1.2,0.03768959939479828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,8,balanced,0.08679466446240743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,8,balanced,0.08853333195050557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,8,power_law_1.01,0.07776640057563781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,8,power_law_1.01,0.08250880241394043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,8,power_law_1.2,0.0803712010383606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,1,8,power_law_1.2,0.08074880242347718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,16,1,balanced,0.0743146687746048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,16,1,balanced,0.0746559997399648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,16,1,power_law_1.01,0.06709759831428527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,16,1,power_law_1.01,0.06748160123825073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,16,1,power_law_1.2,0.0673792004585266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,16,1,power_law_1.2,0.06743040084838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,2,1,balanced,0.22914665937423706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,2,1,balanced,0.22939199209213257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,2,1,power_law_1.01,0.19585280418395995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,2,1,power_law_1.01,0.19642239809036255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,2,1,power_law_1.2,0.1924288034439087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,2,1,power_law_1.2,0.19537919759750366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,32,1,balanced,0.05996799965699514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,32,1,balanced,0.0621919979651769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,32,1,power_law_1.01,0.05459840297698974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,32,1,power_law_1.01,0.05479679703712463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,32,1,power_law_1.2,0.05475839972496033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,32,1,power_law_1.2,0.05550720095634461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,4,1,balanced,0.14564266800880432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,4,1,balanced,0.1457919975121816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,4,1,power_law_1.01,0.1338047981262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,4,1,power_law_1.01,0.13392000198364257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,4,1,power_law_1.2,0.13374719619750977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,4,1,power_law_1.2,0.1345088005065918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,8,1,balanced,0.09733866651852925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,8,1,balanced,0.09739733735720317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,8,1,power_law_1.01,0.08478080034255982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,8,1,power_law_1.01,0.08844159841537476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,8,1,power_law_1.2,0.08477439880371093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,1536,8,128,8,1,power_law_1.2,0.08584319949150085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,1,balanced,2.5990187327067056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,1,balanced,2.606112003326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,1,power_law_1.01,1.9382720947265626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,1,power_law_1.01,1.9632320404052734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,1,power_law_1.2,1.9011711120605468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,1,power_law_1.2,1.908768081665039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,128,balanced,0.08684266606966655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,128,balanced,0.08794666330019633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,128,power_law_1.01,0.0839680016040802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,128,power_law_1.01,0.0846783995628357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,128,power_law_1.2,0.0840448021888733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,128,power_law_1.2,0.08481280207633972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,16,balanced,0.23009065786997476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,16,balanced,0.2302346626917521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,16,power_law_1.01,0.20595200061798097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,16,power_law_1.01,0.21425280570983887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,16,power_law_1.2,0.21763839721679687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,16,power_law_1.2,0.22193920612335205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,2,balanced,1.3277866840362549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,2,balanced,1.3281706968943279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,2,power_law_1.01,1.0507648468017579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,2,power_law_1.01,1.0728639602661132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,2,power_law_1.2,1.0649215698242187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,2,power_law_1.2,1.070470428466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,256,balanced,0.0724373310804367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,256,balanced,0.07447466750939687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,256,power_law_1.01,0.07219200134277344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,256,power_law_1.01,0.0722495973110199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,256,power_law_1.2,0.0711359977722168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,256,power_law_1.2,0.0717631995677948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,32,balanced,0.15643733739852905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,32,balanced,0.1567306617895762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,32,power_law_1.01,0.13609600067138672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,32,power_law_1.01,0.14382079839706421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,32,power_law_1.2,0.14154239892959594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,32,power_law_1.2,0.14825600385665894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,4,balanced,0.7005813121795654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,4,balanced,0.7026399771372477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,4,power_law_1.01,0.6163839817047119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,4,power_law_1.01,0.6289535999298096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,4,power_law_1.2,0.5986112117767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,4,power_law_1.2,0.6351359844207763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,64,balanced,0.10512000322341919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,64,balanced,0.10705066720644633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,64,power_law_1.01,0.09934080243110657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,64,power_law_1.01,0.10126719474792481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,64,power_law_1.2,0.09701120257377624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,64,power_law_1.2,0.09975039958953857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,8,balanced,0.38929065068562824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,8,balanced,0.3895039955774943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,8,power_law_1.01,0.3543040037155151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,8,power_law_1.01,0.3546432018280029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,8,power_law_1.2,0.34167680740356443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,1,8,power_law_1.2,0.36910719871520997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,16,1,balanced,1.3431679407755535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,16,1,balanced,1.3447839419047039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,16,1,power_law_1.01,1.0178175926208497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,16,1,power_law_1.01,1.01910400390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,16,1,power_law_1.2,1.0007743835449219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,16,1,power_law_1.2,1.0030912399291991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,2,1,balanced,1.306949297587077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,2,1,balanced,1.3105226357777913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,2,1,power_law_1.01,0.9729087829589844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,2,1,power_law_1.01,0.9833919525146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,2,1,power_law_1.2,0.9657152175903321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,2,1,power_law_1.2,0.970751953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,32,1,balanced,1.1337813536326091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,32,1,balanced,1.1346720059712727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,32,1,power_law_1.01,0.8600959777832031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,32,1,power_law_1.01,0.863212776184082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,32,1,power_law_1.2,0.85283203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,32,1,power_law_1.2,0.8557888031005859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,4,1,balanced,0.7150293191274008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,4,1,balanced,0.715727965037028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,4,1,power_law_1.01,0.5404863834381104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,4,1,power_law_1.01,0.544595193862915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,4,1,power_law_1.2,0.53788161277771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,4,1,power_law_1.2,0.5405248165130615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,8,1,balanced,0.42238934834798175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,8,1,balanced,0.43588801225026447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,8,1,power_law_1.01,0.3306495904922485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,8,1,power_law_1.01,0.3314111948013306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,8,1,power_law_1.2,0.3221951961517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,4096,2688,22,512,8,1,power_law_1.2,0.32924799919128417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,1,balanced,0.44228800137837726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,1,balanced,0.4467039903004964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,1,power_law_1.01,0.45382399559020997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,1,power_law_1.01,0.4705344200134277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,1,power_law_1.2,0.4722432136535645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,1,power_law_1.2,0.4729599952697754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,2,balanced,0.2493120034535726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,2,balanced,0.27002133925755817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,2,power_law_1.01,0.26733438968658446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,2,power_law_1.01,0.2682816028594971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,2,power_law_1.2,0.2629695892333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,2,power_law_1.2,0.26943359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,4,balanced,0.1662399967511495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,4,balanced,0.17020267248153687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,4,power_law_1.01,0.17455359697341918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,4,power_law_1.01,0.18303999900817872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,4,power_law_1.2,0.1820799946784973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,4,power_law_1.2,0.18394880294799804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,8,balanced,0.1151093343893687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,8,balanced,0.11778666575749715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,8,power_law_1.01,0.13208320140838622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,8,power_law_1.01,0.1337407946586609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,8,power_law_1.2,0.12907520532608033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,1,8,power_law_1.2,0.12980480194091798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,16,1,balanced,0.059765333930651345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,16,1,balanced,0.062090665102005005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,16,1,power_law_1.01,0.05660799741744995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,16,1,power_law_1.01,0.05724160075187683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,16,1,power_law_1.2,0.05639680027961731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,16,1,power_law_1.2,0.056492799520492555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,2,1,balanced,0.23846399784088135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,2,1,balanced,0.24821333090464273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,2,1,power_law_1.01,0.23982079029083253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,2,1,power_law_1.01,0.24198400974273682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,2,1,power_law_1.2,0.23832321166992188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,2,1,power_law_1.2,0.24186239242553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,32,1,balanced,0.03760000069936117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,32,1,balanced,0.03781333317359289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,32,1,power_law_1.01,0.037299200892448425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,32,1,power_law_1.01,0.04121600091457367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,32,1,power_law_1.2,0.03809280097484589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,32,1,power_law_1.2,0.041222399473190306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,4,1,balanced,0.13343466321627298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,4,1,balanced,0.15313599507013956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,4,1,power_law_1.01,0.13185280561447144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,4,1,power_law_1.01,0.1388864040374756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,4,1,power_law_1.2,0.13855359554290772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,4,1,power_law_1.2,0.14979840517044068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,8,1,balanced,0.09498133261998494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,8,1,balanced,0.10086400310198466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,8,1,power_law_1.01,0.07991039752960205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,8,1,power_law_1.01,0.08055679798126221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,8,1,power_law_1.2,0.07988479733467102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,16384,2,8,8,1,power_law_1.2,0.08072320222854615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,1,balanced,1.541002591451009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,1,balanced,1.5429919560750325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,1,power_law_1.01,0.7969088077545166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,1,power_law_1.01,0.8138943672180176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,1,power_law_1.2,0.7337664127349853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,1,power_law_1.2,0.7411263942718506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,128,balanced,0.05641599992911021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,128,balanced,0.057946667075157166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,128,power_law_1.01,0.055327999591827395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,128,power_law_1.01,0.05568000078201294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,128,power_law_1.2,0.05571200251579285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,128,power_law_1.2,0.05605120062828064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,16,balanced,0.14618666966756186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,16,balanced,0.14643200238545737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,16,power_law_1.01,0.12641279697418212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,16,power_law_1.01,0.14421759843826293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,16,power_law_1.2,0.11240960359573364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,16,power_law_1.2,0.11498240232467652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,2,balanced,0.7941546440124512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,2,balanced,0.7974186738332113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,2,power_law_1.01,0.40008959770202634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,2,power_law_1.01,0.4559487819671631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,2,power_law_1.2,0.40615038871765136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,2,power_law_1.2,0.41050238609313966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,256,balanced,0.04965866605440775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,256,balanced,0.05036266644795736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,256,power_law_1.01,0.048390400409698484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,256,power_law_1.01,0.04886400103569031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,256,power_law_1.2,0.048467200994491574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,256,power_law_1.2,0.04901120066642761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,32,balanced,0.0929813285668691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,32,balanced,0.09393067161242168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,32,power_law_1.01,0.07758079767227173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,32,power_law_1.01,0.09246079921722412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,32,power_law_1.2,0.08056960105895997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,32,power_law_1.2,0.08111360073089599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,4,balanced,0.42556265989939374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,4,balanced,0.43216534455617267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,4,power_law_1.01,0.25883519649505615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,4,power_law_1.01,0.29348480701446533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,4,power_law_1.2,0.24860799312591553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,4,power_law_1.2,0.2598655939102173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,64,balanced,0.07260799904664357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,64,balanced,0.07455466687679291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,64,power_law_1.01,0.06933760046958923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,64,power_law_1.01,0.0703935980796814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,64,power_law_1.2,0.0688256025314331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,64,power_law_1.2,0.0692351996898651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,8,balanced,0.24148799975713095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,8,balanced,0.2422879934310913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,8,power_law_1.01,0.18572160005569457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,8,power_law_1.01,0.2123392105102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,8,power_law_1.2,0.1886016011238098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,1,8,power_law_1.2,0.2024768114089966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,16,1,balanced,0.1786080002784729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,16,1,balanced,0.17981332540512085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,16,1,power_law_1.01,0.107750403881073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,16,1,power_law_1.01,0.11096960306167603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,16,1,power_law_1.2,0.10122879743576049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,16,1,power_law_1.2,0.10289920568466186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,2,1,balanced,0.7764426867167155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,2,1,balanced,0.778170665105184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,2,1,power_law_1.01,0.4187136173248291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,2,1,power_law_1.01,0.42256641387939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,2,1,power_law_1.2,0.37484800815582275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,2,1,power_law_1.2,0.38549759387969973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,32,1,balanced,0.1404159963130951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,32,1,balanced,0.14231999715169272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,32,1,power_law_1.01,0.09544320106506347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,32,1,power_law_1.01,0.09610880017280579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,32,1,power_law_1.2,0.08851199746131896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,32,1,power_law_1.2,0.09126399755477906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,4,1,balanced,0.4331626494725545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,4,1,balanced,0.4344373146692912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,4,1,power_law_1.01,0.24179201126098632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,4,1,power_law_1.01,0.24469120502471925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,4,1,power_law_1.2,0.22018558979034425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,4,1,power_law_1.2,0.22818560600280763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,8,1,balanced,0.2659626603126526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,8,1,balanced,0.2660906712214152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,8,1,power_law_1.01,0.1610111951828003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,8,1,power_law_1.01,0.1618175983428955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,8,1,power_law_1.2,0.1446463942527771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2048,8,256,8,1,power_law_1.2,0.14521600008010865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,1,balanced,1.2117493152618408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,1,balanced,1.2119359970092773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,1,power_law_1.01,0.9659775733947754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,1,power_law_1.01,0.9761343955993652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,1,power_law_1.2,0.9533632278442383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,1,power_law_1.2,0.965459156036377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,16,balanced,0.1218986709912618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,16,balanced,0.12486933668454488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,16,power_law_1.01,0.11377919912338257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,16,power_law_1.01,0.11386239528656006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,16,power_law_1.2,0.11093120574951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,16,power_law_1.2,0.11148799657821655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,2,balanced,0.6315040191014608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,2,balanced,0.6324053208033243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,2,power_law_1.01,0.5289152145385743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,2,power_law_1.01,0.5355840206146241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,2,power_law_1.2,0.4752064228057861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,2,power_law_1.2,0.5094079971313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,32,balanced,0.07855466504891713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,32,balanced,0.0786186655362447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,32,power_law_1.01,0.07468159794807434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,32,power_law_1.01,0.07774080038070678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,32,power_law_1.2,0.07575039863586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,32,power_law_1.2,0.07605760097503662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,4,balanced,0.34245868523915607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,4,balanced,0.3571893374125163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,4,power_law_1.01,0.2889343976974487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,4,power_law_1.01,0.3063807964324951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,4,power_law_1.2,0.2900736093521118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,4,power_law_1.2,0.3033983945846558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,8,balanced,0.1927786668141683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,8,balanced,0.19375999768575033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,8,power_law_1.01,0.1821951985359192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,8,power_law_1.01,0.1891711950302124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,8,power_law_1.2,0.17152639627456664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,1,8,power_law_1.2,0.18629759550094604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,16,1,balanced,0.14637866616249084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,16,1,balanced,0.15030399958292642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,16,1,power_law_1.01,0.12137600183486938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,16,1,power_law_1.01,0.1218559980392456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,16,1,power_law_1.2,0.11537280082702636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,16,1,power_law_1.2,0.12004480361938477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,2,1,balanced,0.6175680160522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,2,1,balanced,0.6195253531138102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,2,1,power_law_1.01,0.48856320381164553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,2,1,power_law_1.01,0.49385600090026854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,2,1,power_law_1.2,0.4872000217437744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,2,1,power_law_1.2,0.488102388381958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,32,1,balanced,0.10957333445549011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,32,1,balanced,0.10971732934315999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,32,1,power_law_1.01,0.09238399863243103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,32,1,power_law_1.01,0.09276800155639649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,32,1,power_law_1.2,0.09114239811897278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,32,1,power_law_1.2,0.0929535984992981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,4,1,balanced,0.3440213203430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,4,1,balanced,0.34479467074076336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,4,1,power_law_1.01,0.27480320930480956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,4,1,power_law_1.01,0.27765119075775146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,4,1,power_law_1.2,0.2666624069213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,4,1,power_law_1.2,0.27360000610351565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,8,1,balanced,0.21401600042978922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,8,1,balanced,0.21804267168045044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,8,1,power_law_1.01,0.1802559971809387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,8,1,power_law_1.01,0.18246400356292725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,8,1,power_law_1.2,0.1779263973236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,6144,2560,8,160,8,1,power_law_1.2,0.18140159845352172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,1,balanced,1.7974613507588704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,1,balanced,1.7995999654134114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,1,power_law_1.01,0.9027071952819824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,1,power_law_1.01,0.9451583862304688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,1,power_law_1.2,0.8619071960449218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,1,power_law_1.2,0.8676671981811523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,128,balanced,0.06228266656398773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,128,balanced,0.06451733410358429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,128,power_law_1.01,0.06222720146179199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,128,power_law_1.01,0.06458240151405334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,128,power_law_1.2,0.06437119841575623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,128,power_law_1.2,0.06554880142211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,16,balanced,0.16423466801643372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,16,balanced,0.16497600078582764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,16,power_law_1.01,0.12577279806137084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,16,power_law_1.01,0.14977279901504517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,16,power_law_1.2,0.11303039789199829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,16,power_law_1.2,0.13191039562225343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,2,balanced,0.9246666431427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,2,balanced,0.927354653676351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,2,power_law_1.01,0.5045695781707764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,2,power_law_1.01,0.5516223907470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,2,power_law_1.2,0.5117631912231445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,2,power_law_1.2,0.5253632068634033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,256,balanced,0.054101333022117615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,256,balanced,0.05412800113360087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,256,power_law_1.01,0.05306879878044128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,256,power_law_1.01,0.053363198041915895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,256,power_law_1.2,0.052665597200393675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,256,power_law_1.2,0.054476797580718994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,32,balanced,0.10710933804512024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,32,balanced,0.10909333825111389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,32,power_law_1.01,0.089273601770401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,32,power_law_1.01,0.09925119876861573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,32,power_law_1.2,0.09040639996528625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,32,power_law_1.2,0.09126399755477906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,4,balanced,0.49885332584381104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,4,balanced,0.5396159887313843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,4,power_law_1.01,0.2975935935974121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,4,power_law_1.01,0.32403199672698973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,4,power_law_1.2,0.30737919807434083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,4,power_law_1.2,0.3135871887207031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,64,balanced,0.08029333253701527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,64,balanced,0.08061333497365315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,64,power_law_1.01,0.07543039917945862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,64,power_law_1.01,0.07800319790840149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,64,power_law_1.2,0.07335039973258972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,64,power_law_1.2,0.07441279888153077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,8,balanced,0.27158933877944946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,8,balanced,0.280623992284139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,8,power_law_1.01,0.21722879409790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,8,power_law_1.01,0.24131200313568116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,8,power_law_1.2,0.21998720169067382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,1,8,power_law_1.2,0.23703041076660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,16,1,balanced,0.20001065731048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,16,1,balanced,0.2069759964942932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,16,1,power_law_1.01,0.12275199890136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,16,1,power_law_1.01,0.12296960353851319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,16,1,power_law_1.2,0.11468160152435303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,16,1,power_law_1.2,0.1147968053817749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,2,1,balanced,0.9054880142211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,2,1,balanced,0.9096693197886149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,2,1,power_law_1.01,0.4796480178833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,2,1,power_law_1.01,0.4902463912963867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,2,1,power_law_1.2,0.42814078330993655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,2,1,power_law_1.2,0.440396785736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,32,1,balanced,0.15853333473205566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,32,1,balanced,0.1588533322016398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,32,1,power_law_1.01,0.10711679458618165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,32,1,power_law_1.01,0.10790400505065918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,32,1,power_law_1.2,0.10127359628677368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,32,1,power_law_1.2,0.10209920406341552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,4,1,balanced,0.5017760197321574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,4,1,balanced,0.5107306639353434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,4,1,power_law_1.01,0.2832256078720093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,4,1,power_law_1.01,0.286297607421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,4,1,power_law_1.2,0.2632191896438599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,4,1,power_law_1.2,0.26888959407806395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,8,1,balanced,0.30554133653640747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,8,1,balanced,0.30796267588933307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,8,1,power_law_1.01,0.17801599502563475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,8,1,power_law_1.01,0.17920639514923095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,8,1,power_law_1.2,0.16406400203704835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,256,8,1,power_law_1.2,0.16748160123825073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,1,balanced,1.8032159805297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,1,balanced,1.8059306144714355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,1,power_law_1.01,1.1706048011779786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,1,power_law_1.01,1.1736895561218261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,1,power_law_1.2,1.062393569946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,1,power_law_1.2,1.0664064407348632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,128,balanced,0.06482133269309998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,128,balanced,0.06637333333492279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,128,power_law_1.01,0.06995840072631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,128,power_law_1.01,0.07167360186576843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,128,power_law_1.2,0.06915839910507202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,128,power_law_1.2,0.07031040191650391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,16,balanced,0.16317333777745566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,16,balanced,0.16334399580955505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,16,power_law_1.01,0.2040191888809204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,16,power_law_1.01,0.21679999828338622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,16,power_law_1.2,0.19645440578460693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,16,power_law_1.2,0.21633920669555665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,2,balanced,0.9281333287556967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,2,balanced,0.9288907051086426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,2,power_law_1.01,0.6941440105438232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,2,power_law_1.01,0.7011263847351075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,2,power_law_1.2,0.6487743854522705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,2,power_law_1.2,0.6514304161071778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,32,balanced,0.10693867007891338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,32,balanced,0.10897599657376607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,32,power_law_1.01,0.12924799919128419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,32,power_law_1.01,0.1359295964241028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,32,power_law_1.2,0.12454400062561036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,32,power_law_1.2,0.14395519495010375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,4,balanced,0.4918400049209595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,4,balanced,0.4937066634496053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,4,power_law_1.01,0.41558399200439455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,4,power_law_1.01,0.4643199920654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,4,power_law_1.2,0.4183551788330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,4,power_law_1.2,0.43766398429870607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,64,balanced,0.08057599763075511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,64,balanced,0.08201600114504497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,64,power_law_1.01,0.08554880023002624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,64,power_law_1.01,0.08557440042495727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,64,power_law_1.2,0.08234239816665649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,64,power_law_1.2,0.08481919765472412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,8,balanced,0.27568533023198444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,8,balanced,0.2762933373451233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,8,power_law_1.01,0.28857600688934326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,8,power_law_1.01,0.298854398727417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,8,power_law_1.2,0.2755392074584961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,1,8,power_law_1.2,0.32947840690612795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,16,1,balanced,0.20190932353337607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,16,1,balanced,0.20362667242685953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,16,1,power_law_1.01,0.1496384024620056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,16,1,power_law_1.01,0.15191680192947388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,16,1,power_law_1.2,0.13354239463806153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,16,1,power_law_1.2,0.1336192011833191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,2,1,balanced,0.9051093260447184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,2,1,balanced,0.9074026743570963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,2,1,power_law_1.01,0.5937664031982421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,2,1,power_law_1.01,0.5983168125152588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,2,1,power_law_1.2,0.551206398010254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,2,1,power_law_1.2,0.5516608238220215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,32,1,balanced,0.1604159971078237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,32,1,balanced,0.16050133109092712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,32,1,power_law_1.01,0.1181439995765686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,32,1,power_law_1.01,0.12074240446090698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,32,1,power_law_1.2,0.11374720335006713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,32,1,power_law_1.2,0.11418880224227905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,4,1,balanced,0.5029386679331461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,4,1,balanced,0.5034559965133667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,4,1,power_law_1.01,0.3382080078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,4,1,power_law_1.01,0.34018559455871583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,4,1,power_law_1.2,0.3111936092376709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,4,1,power_law_1.2,0.3126399993896484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,8,1,balanced,0.3022186756134033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,8,1,balanced,0.3024746576944987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,8,1,power_law_1.01,0.21674880981445313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,8,1,power_law_1.01,0.21755518913269042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,8,1,power_law_1.2,0.20015358924865723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,32,7168,2048,8,384,8,1,power_law_1.2,0.20361599922180176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,1,balanced,0.15344533324241638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,1,balanced,0.15457600355148315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,1,power_law_1.01,0.1498304009437561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,1,power_law_1.01,0.14991999864578248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,1,power_law_1.2,0.15112320184707642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,1,power_law_1.2,0.15184639692306517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,128,balanced,0.057855998476346336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,128,balanced,0.058037335673967995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,128,power_law_1.01,0.055641597509384154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,128,power_law_1.01,0.055929601192474365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,128,power_law_1.2,0.05575680136680603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,128,power_law_1.2,0.05611519813537598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,16,balanced,0.057855998476346336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,16,balanced,0.05823466678460439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,16,power_law_1.01,0.05807999968528747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,16,power_law_1.01,0.05817599892616272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,16,power_law_1.2,0.058143997192382814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,16,power_law_1.2,0.0585919976234436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,2,balanced,0.10712533195813496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,2,balanced,0.10774399836858113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,2,power_law_1.01,0.10589439868927002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,2,power_law_1.01,0.10668799877166749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,2,power_law_1.2,0.10864640474319458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,2,power_law_1.2,0.1089087963104248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,32,balanced,0.057962665955225624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,32,balanced,0.05824000140031179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,32,power_law_1.01,0.05624319911003113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,32,power_law_1.01,0.05630080103874206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,32,power_law_1.2,0.05678719878196716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,32,power_law_1.2,0.05719040036201477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,4,balanced,0.08451199531555176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,4,balanced,0.08513066172599792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,4,power_law_1.01,0.08528640270233154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,4,power_law_1.01,0.08543360233306885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,4,power_law_1.2,0.08592000007629394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,4,power_law_1.2,0.08766720294952393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,64,balanced,0.05791999896367391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,64,balanced,0.05808533231417338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,64,power_law_1.01,0.05566080212593079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,64,power_law_1.01,0.05666559934616089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,64,power_law_1.2,0.057036799192428586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,64,power_law_1.2,0.0572160005569458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,8,balanced,0.06398933132489522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,8,balanced,0.0655680000782013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,8,power_law_1.01,0.06559360027313232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,8,power_law_1.01,0.06732800006866455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,8,power_law_1.2,0.06596480011940002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,1,8,power_law_1.2,0.06746879816055298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,2,1,balanced,0.1018239955107371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,2,1,balanced,0.10333866874376933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,2,1,power_law_1.01,0.10115840435028076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,2,1,power_law_1.01,0.10140800476074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,2,1,power_law_1.2,0.10372480154037475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,2,1,power_law_1.2,0.10448000431060792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,4,1,balanced,0.08070399860541026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,4,1,balanced,0.08086400230725606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,4,1,power_law_1.01,0.07945600152015686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,4,1,power_law_1.01,0.08071039915084839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,4,1,power_law_1.2,0.08039039969444275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2048,768,8,128,4,1,power_law_1.2,0.08152959942817688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,1,balanced,0.3673493464787801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,1,balanced,0.3689333200454712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,1,power_law_1.01,0.34530560970306395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,1,power_law_1.01,0.35306880474090574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,1,power_law_1.2,0.3542207956314087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,1,power_law_1.2,0.35766398906707764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,128,balanced,0.07693866888682048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,128,balanced,0.07838400204976399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,128,power_law_1.01,0.07744640111923218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,128,power_law_1.01,0.07785599827766418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,128,power_law_1.2,0.07823359966278076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,128,power_law_1.2,0.07839360237121581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,16,balanced,0.09058133761088054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,16,balanced,0.09170132875442505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,16,power_law_1.01,0.08781440258026123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,16,power_law_1.01,0.09086719751358033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,16,power_law_1.2,0.08882560133934021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,16,power_law_1.2,0.09041280150413514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,2,balanced,0.23076266050338745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,2,balanced,0.23368000984191895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,2,power_law_1.01,0.22148480415344238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,2,power_law_1.01,0.22536320686340333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,2,power_law_1.2,0.22364161014556885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,2,power_law_1.2,0.22675199508666993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,32,balanced,0.07975466549396515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,32,balanced,0.08473066488901775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,32,power_law_1.01,0.08309119939804077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,32,power_law_1.01,0.08383359909057617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,32,power_law_1.2,0.0830847978591919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,32,power_law_1.2,0.08359040021896362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,4,balanced,0.15778133273124695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,4,balanced,0.1584160029888153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,4,power_law_1.01,0.14935679435729982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,4,power_law_1.01,0.15070719718933107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,4,power_law_1.2,0.15199999809265136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,4,power_law_1.2,0.15454720258712767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,64,balanced,0.0786186655362447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,64,balanced,0.07863999903202057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,64,power_law_1.01,0.07822719812393189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,64,power_law_1.01,0.07902079820632935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,64,power_law_1.2,0.07875199913978577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,64,power_law_1.2,0.07904639840126038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,8,balanced,0.11783466736475627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,8,balanced,0.11943466464678447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,8,power_law_1.01,0.11432960033416747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,8,power_law_1.01,0.11697920560836791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,8,power_law_1.2,0.1174015998840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,1,8,power_law_1.2,0.11819519996643066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,16,1,balanced,0.3317013382911682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,16,1,balanced,0.3330453236897786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,16,1,power_law_1.01,0.3216576099395752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,16,1,power_law_1.01,0.32717440128326414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,16,1,power_law_1.2,0.32889599800109864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,16,1,power_law_1.2,0.3359872102737427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,2,1,balanced,0.21854400634765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,2,1,balanced,0.22095467646916708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,2,1,power_law_1.01,0.20855040550231935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,2,1,power_law_1.01,0.21127040386199952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,2,1,power_law_1.2,0.21059839725494384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,2,1,power_law_1.2,0.21421439647674562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,32,1,balanced,0.29365332921346027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,32,1,balanced,0.2948053280512492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,32,1,power_law_1.01,0.28497920036315916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,32,1,power_law_1.01,0.2865407943725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,32,1,power_law_1.2,0.2940095901489258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,32,1,power_law_1.2,0.2974463939666748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,4,1,balanced,0.14355199535687765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,4,1,balanced,0.14386666814486185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,4,1,power_law_1.01,0.13887360095977783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,4,1,power_law_1.01,0.13976320028305053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,4,1,power_law_1.2,0.1405184030532837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,4,1,power_law_1.2,0.14248960018157958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,8,1,balanced,0.430949330329895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,8,1,balanced,0.4325386683146159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,8,1,power_law_1.01,0.4150720119476318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,8,1,power_law_1.01,0.4186560153961182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,8,1,power_law_1.2,0.42557439804077146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,2688,1856,6,128,8,1,power_law_1.2,0.4344128131866455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,1,balanced,0.6176000038782755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,1,balanced,0.6185226837793986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,1,power_law_1.01,0.5512383937835693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,1,power_law_1.01,0.5552063941955566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,1,power_law_1.2,0.5527232170104981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,1,power_law_1.2,0.5613759994506836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,128,balanced,0.1133066713809967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,128,balanced,0.11359999577204387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,128,power_law_1.01,0.1110975980758667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,128,power_law_1.01,0.11130239963531494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,128,power_law_1.2,0.1126207947731018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,128,power_law_1.2,0.112716805934906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,16,balanced,0.1479039986928304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,16,balanced,0.148117333650589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,16,power_law_1.01,0.13719680309295654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,16,power_law_1.01,0.13808640241622924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,16,power_law_1.2,0.14017280340194702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,16,power_law_1.2,0.14508800506591796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,2,balanced,0.3744106690088908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,2,balanced,0.3755733172098796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,2,power_law_1.01,0.3469311952590942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,2,power_law_1.01,0.3523200035095215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,2,power_law_1.2,0.33676159381866455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,2,power_law_1.2,0.3480767965316772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,256,balanced,0.11317867040634155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,256,balanced,0.113237331310908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,256,power_law_1.01,0.11088639497756958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,256,power_law_1.01,0.11121920347213746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,256,power_law_1.2,0.11118719577789307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,256,power_law_1.2,0.11160320043563843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,32,balanced,0.12322133779525757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,32,balanced,0.12441600362459819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,32,power_law_1.01,0.12122880220413208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,32,power_law_1.01,0.12135679721832275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,32,power_law_1.2,0.12282880544662475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,32,power_law_1.2,0.1238144040107727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,4,balanced,0.24766399463017783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,4,balanced,0.2479520042737325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,4,power_law_1.01,0.23681919574737548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,4,power_law_1.01,0.23880960941314697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,4,power_law_1.2,0.2349247932434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,4,power_law_1.2,0.24060800075531005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,64,balanced,0.11541866262753804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,64,balanced,0.11725333333015442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,64,power_law_1.01,0.11495039463043213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,64,power_law_1.01,0.1152448058128357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,64,power_law_1.2,0.11681920289993286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,64,power_law_1.2,0.11693439483642579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,8,balanced,0.1798186699549357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,8,balanced,0.18106132745742798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,8,power_law_1.01,0.1701311945915222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,8,power_law_1.01,0.17072639465332032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,8,power_law_1.2,0.17153279781341552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,1,8,power_law_1.2,0.17284480333328248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,16,1,balanced,0.141157329082489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,16,1,balanced,0.1411786675453186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,16,1,power_law_1.01,0.12576639652252197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,16,1,power_law_1.01,0.1283455967903137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,16,1,power_law_1.2,0.13301119804382325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,16,1,power_law_1.2,0.13308800458908082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,2,1,balanced,0.3489546775817871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,2,1,balanced,0.34906665484110516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,2,1,power_law_1.01,0.3190144062042236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,2,1,power_law_1.01,0.3240895986557007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,2,1,power_law_1.2,0.32164480686187746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,2,1,power_law_1.2,0.3306623935699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,32,1,balanced,0.12161067128181458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,32,1,balanced,0.12245866656303406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,32,1,power_law_1.01,0.11485439538955688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,32,1,power_law_1.01,0.11501439809799194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,32,1,power_law_1.2,0.11507200002670288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,32,1,power_law_1.2,0.116211199760437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,4,1,balanced,0.22438400983810425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,4,1,balanced,0.22618667284647623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,4,1,power_law_1.01,0.20565121173858641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,4,1,power_law_1.01,0.20837759971618652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,4,1,power_law_1.2,0.20993280410766602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,4,1,power_law_1.2,0.21307520866394042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,8,1,balanced,0.16375466187795004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,8,1,balanced,0.16459199786186218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,8,1,power_law_1.01,0.15478399991989136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,8,1,power_law_1.01,0.1554304003715515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,8,1,power_law_1.2,0.15518720149993898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,3072,1536,8,256,8,1,power_law_1.2,0.15539200305938722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,1,balanced,0.4164586861928304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,1,balanced,0.4184960126876831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,1,power_law_1.01,0.4338816165924072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,1,power_law_1.01,0.4374591827392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,1,power_law_1.2,0.4190783977508545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,1,power_law_1.2,0.4219007968902588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,2,balanced,0.2558773358662923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,2,balanced,0.25657065709431964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,2,power_law_1.01,0.28296959400177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,2,power_law_1.01,0.2900799989700317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,2,power_law_1.2,0.2739840030670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,2,power_law_1.2,0.2944191932678223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,4,balanced,0.1997119983037313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,4,balanced,0.20007999738057455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,4,power_law_1.01,0.21155838966369628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,4,power_law_1.01,0.22561919689178467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,4,power_law_1.2,0.2159872055053711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,4,power_law_1.2,0.22044799327850342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,8,balanced,0.17757866779963175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,8,balanced,0.17791465918223062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,8,power_law_1.01,0.19409919977188111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,8,power_law_1.01,0.19473279714584352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,8,power_law_1.2,0.1948799967765808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,1,8,power_law_1.2,0.19493759870529176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,16,1,balanced,0.06586133440335591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,16,1,balanced,0.07231466472148895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,16,1,power_law_1.01,0.06695680022239685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,16,1,power_law_1.01,0.06865280270576476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,16,1,power_law_1.2,0.06872959733009339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,16,1,power_law_1.2,0.06922879815101624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,2,1,balanced,0.23626132806142172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,2,1,balanced,0.23637332518895468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,2,1,power_law_1.01,0.2298815965652466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,2,1,power_law_1.01,0.23172481060028077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,2,1,power_law_1.2,0.2283776044845581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,2,1,power_law_1.2,0.23363199234008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,32,1,balanced,0.0496319979429245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,32,1,balanced,0.05402666827042898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,32,1,power_law_1.01,0.04833920001983642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,32,1,power_law_1.01,0.048582398891448976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,32,1,power_law_1.2,0.04837760031223297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,32,1,power_law_1.2,0.0522816002368927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,4,1,balanced,0.1442506710688273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,4,1,balanced,0.14566399653752646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,4,1,power_law_1.01,0.1310271978378296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,4,1,power_law_1.01,0.13319040536880494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,4,1,power_law_1.2,0.13328640460968016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,4,1,power_law_1.2,0.13495680093765258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,8,1,balanced,0.09684800108273824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,8,1,balanced,0.10032000144322713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,8,1,power_law_1.01,0.08733440041542054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,8,1,power_law_1.01,0.09370880126953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,8,1,power_law_1.2,0.08627840280532836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,14336,2,8,8,1,power_law_1.2,0.08840320110321045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,1,balanced,0.4361813465754191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,1,balanced,0.43856000900268555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,1,power_law_1.01,0.43999361991882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,1,power_law_1.01,0.4407487869262695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,1,power_law_1.2,0.44637441635131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,1,power_law_1.2,0.45036802291870115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,128,balanced,0.08892800410588582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,128,balanced,0.08925333619117737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,128,power_law_1.01,0.09047039747238159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,128,power_law_1.01,0.09130880236625671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,128,power_law_1.2,0.09132159948348999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,128,power_law_1.2,0.09146239757537841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,16,balanced,0.10541333754857381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,16,balanced,0.1060693363348643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,16,power_law_1.01,0.10773760080337524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,16,power_law_1.01,0.11068160533905029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,16,power_law_1.2,0.11056640148162841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,16,power_law_1.2,0.11075199842453003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,2,balanced,0.27108800411224365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,2,balanced,0.27264533440272015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,2,power_law_1.01,0.2635200023651123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,2,power_law_1.01,0.26571519374847413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,2,power_law_1.2,0.27143039703369143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,2,power_law_1.2,0.273907208442688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,32,balanced,0.09603733817736308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,32,balanced,0.0972053309281667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,32,power_law_1.01,0.0979968011379242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,32,power_law_1.01,0.09853439927101135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,32,power_law_1.2,0.09985920190811157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,32,power_law_1.2,0.09991679787635803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,4,balanced,0.18010133504867554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,4,balanced,0.18095999956130981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,4,power_law_1.01,0.186080002784729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,4,power_law_1.01,0.18630399703979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,4,power_law_1.2,0.18598400354385375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,4,power_law_1.2,0.18772480487823487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,64,balanced,0.09329066673914592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,64,balanced,0.09386133154233296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,64,power_law_1.01,0.09285119771957398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,64,power_law_1.01,0.09355520009994507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,64,power_law_1.2,0.09415040016174317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,64,power_law_1.2,0.09485440254211426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,8,balanced,0.13769066333770752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,8,balanced,0.13802133003870645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,8,power_law_1.01,0.14045439958572387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,8,power_law_1.01,0.14075520038604736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,8,power_law_1.2,0.14013439416885376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,1,8,power_law_1.2,0.14046720266342164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,16,1,balanced,0.11085333426793416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,16,1,balanced,0.11134399970372517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,16,1,power_law_1.01,0.10972800254821777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,16,1,power_law_1.01,0.11052800416946411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,16,1,power_law_1.2,0.11082240343093872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,2,1,balanced,0.25779734055201214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,2,1,balanced,0.2587520082791646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,2,1,power_law_1.01,0.253875207901001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,2,1,power_law_1.01,0.2545919895172119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,2,1,power_law_1.2,0.2551743984222412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,2,1,power_law_1.2,0.2566976070404053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,32,1,balanced,0.10296000043551128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,32,1,balanced,0.10340799887975057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,32,1,power_law_1.01,0.1023743987083435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,32,1,power_law_1.01,0.10241919755935669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,32,1,power_law_1.2,0.10300159454345703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,32,1,power_law_1.2,0.10328320264816285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,4,1,balanced,0.16766933600107828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,4,1,balanced,0.1690559983253479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,4,1,power_law_1.01,0.16465920209884644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,4,1,power_law_1.01,0.16621439456939696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,4,1,power_law_1.2,0.16839679479598998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,4,1,power_law_1.2,0.16970880031585694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,8,1,balanced,0.12780800461769104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,8,1,balanced,0.12851199507713318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,8,1,power_law_1.01,0.12696319818496704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,8,1,power_law_1.01,0.12728960514068605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,8,1,power_law_1.2,0.12729599475860595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,1536,8,128,8,1,power_law_1.2,0.1319551944732666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,1,balanced,2.825765291849772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,1,balanced,2.846405347188314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,1,power_law_1.01,2.5677120208740236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,1,power_law_1.01,2.6308416366577148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,1,power_law_1.2,2.6415359497070314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,1,power_law_1.2,2.705561637878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,128,balanced,0.34003734588623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,128,balanced,0.3408000071843465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,128,power_law_1.01,0.34138240814208987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,128,power_law_1.01,0.34156160354614257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,128,power_law_1.2,0.3443392038345337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,128,power_law_1.2,0.3447743892669678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,16,balanced,0.49930667877197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,16,balanced,0.5015146732330322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,16,power_law_1.01,0.48446078300476075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,16,power_law_1.01,0.4846335887908936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,16,power_law_1.2,0.4911359786987305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,16,power_law_1.2,0.49292798042297364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,2,balanced,1.5577279726664226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,2,balanced,1.5728267033894856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,2,power_law_1.01,1.4542336463928223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,2,power_law_1.01,1.4625215530395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,2,power_law_1.2,1.5046400070190429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,2,power_law_1.2,1.5059967994689942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,256,balanced,0.3367840051651001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,256,balanced,0.3373226722081502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,256,power_law_1.01,0.3358207941055298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,256,power_law_1.01,0.33666560649871824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,256,power_law_1.2,0.3368767976760864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,256,power_law_1.2,0.3375808000564575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,32,balanced,0.41225600242614746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,32,balanced,0.4129759867986043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,32,power_law_1.01,0.404633617401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,32,power_law_1.01,0.4112959861755371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,32,power_law_1.2,0.4141248226165771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,32,power_law_1.2,0.4141632080078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,4,balanced,0.9526879787445068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,4,balanced,0.9572319984436035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,4,power_law_1.01,0.896998405456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,4,power_law_1.01,0.9035455703735351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,4,power_law_1.2,0.917574405670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,4,power_law_1.2,0.9233792304992676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,64,balanced,0.36086400349934894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,64,balanced,0.36348267396291095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,64,power_law_1.01,0.3670016050338745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,64,power_law_1.01,0.3686079978942871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,64,power_law_1.2,0.3733376026153564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,64,power_law_1.2,0.3813632011413574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,8,balanced,0.6524693171183268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,8,balanced,0.6534186601638794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,8,power_law_1.01,0.6296192169189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,8,power_law_1.01,0.6330880165100098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,8,power_law_1.2,0.6331776142120361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,1,8,power_law_1.2,0.648518419265747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,16,1,balanced,2.311744054158529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,16,1,balanced,2.3129067420959473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,16,1,power_law_1.01,2.198649597167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,16,1,power_law_1.01,2.2028224945068358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,16,1,power_law_1.2,2.28472957611084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,16,1,power_law_1.2,2.2912128448486326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,2,1,balanced,1.457584063212077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,2,1,balanced,1.4703307151794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,2,1,power_law_1.01,1.3322751998901368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,2,1,power_law_1.01,1.3391039848327637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,2,1,power_law_1.2,1.3876992225646974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,2,1,power_law_1.2,1.3981760025024415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,32,1,balanced,1.797013282775879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,32,1,balanced,1.7988640467325847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,32,1,power_law_1.01,1.7031744003295899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,32,1,power_law_1.01,1.73306884765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,32,1,power_law_1.2,1.8015104293823243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,32,1,power_law_1.2,1.8068223953247071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,4,1,balanced,0.8238080342610677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,4,1,balanced,0.8256213665008545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,4,1,power_law_1.01,0.7753983974456787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,4,1,power_law_1.01,0.7775487899780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,4,1,power_law_1.2,0.8045951843261718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,4,1,power_law_1.2,0.8055423736572266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,8,1,balanced,0.5208106835683187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,8,1,balanced,0.5218293269475301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,8,1,power_law_1.01,0.4935999870300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,8,1,power_law_1.01,0.5002240180969239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,8,1,power_law_1.2,0.5132927894592285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,4096,2688,22,512,8,1,power_law_1.2,0.5159999847412109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,1,balanced,0.6810133457183838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,1,balanced,0.6837653319040934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,1,power_law_1.01,0.6577343940734863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,1,power_law_1.01,0.6748415946960449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,1,power_law_1.2,0.6577023983001709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,1,power_law_1.2,0.6719999790191651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,2,balanced,0.3901546796162923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,2,balanced,0.3952373266220093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,2,power_law_1.01,0.4465151786804199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,2,power_law_1.01,0.46248321533203124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,2,power_law_1.2,0.4217984199523926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,2,power_law_1.2,0.42515201568603517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,4,balanced,0.258133331934611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,4,balanced,0.2602826754252116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,4,power_law_1.01,0.27974400520324705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,4,power_law_1.01,0.2814784049987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,4,power_law_1.2,0.2857919931411743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,4,power_law_1.2,0.30023679733276365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,8,balanced,0.21843733390172324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,8,balanced,0.2192266583442688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,8,power_law_1.01,0.23849599361419677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,8,power_law_1.01,0.249183988571167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,8,power_law_1.2,0.24522240161895753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,1,8,power_law_1.2,0.2470463991165161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,16,1,balanced,0.09246399998664856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,16,1,balanced,0.09266133109728496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,16,1,power_law_1.01,0.08844799995422363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,16,1,power_law_1.01,0.08888319730758668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,16,1,power_law_1.2,0.08812159895896912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,16,1,power_law_1.2,0.08912000060081482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,2,1,balanced,0.33900801340738934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,2,1,balanced,0.33955200513203937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,2,1,power_law_1.01,0.3383039951324463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,2,1,power_law_1.01,0.34291839599609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,2,1,power_law_1.2,0.33597440719604493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,2,1,power_law_1.2,0.3465087890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,32,1,balanced,0.0746506651242574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,32,1,balanced,0.07869333525498708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,32,1,power_law_1.01,0.07694720029830933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,32,1,power_law_1.01,0.07713279724121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,32,1,power_law_1.2,0.07627519965171814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,32,1,power_law_1.2,0.07660160064697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,4,1,balanced,0.20002132654190063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,4,1,balanced,0.20107734203338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,4,1,power_law_1.01,0.18973439931869507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,4,1,power_law_1.01,0.19498239755630492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,4,1,power_law_1.2,0.19663360118865966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,4,1,power_law_1.2,0.19689600467681884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,8,1,balanced,0.1341386636098226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,8,1,balanced,0.13499200344085693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,8,1,power_law_1.01,0.12497919797897339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,8,1,power_law_1.01,0.12868479490280152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,8,1,power_law_1.2,0.1276927947998047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,16384,2,8,8,1,power_law_1.2,0.1295807957649231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,1,balanced,1.6003306706746419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,1,balanced,1.6099467277526855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,1,power_law_1.01,1.3577535629272461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,1,power_law_1.01,1.3814784049987794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,1,power_law_1.2,1.4170240402221679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,1,power_law_1.2,1.4656384468078614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,128,balanced,0.17857066790262857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,128,balanced,0.1802240014076233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,128,power_law_1.01,0.17681920528411865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,128,power_law_1.01,0.1771008014678955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,128,power_law_1.2,0.17701760530471802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,128,power_law_1.2,0.17794560194015502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,16,balanced,0.2657173275947571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,16,balanced,0.26703999439875287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,16,power_law_1.01,0.2589119911193848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,16,power_law_1.01,0.26177918910980225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,16,power_law_1.2,0.260096001625061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,16,power_law_1.2,0.26180479526519773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,2,balanced,0.8819680213928223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,2,balanced,0.8842933177947998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,2,power_law_1.01,0.7920832157135009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,2,power_law_1.01,0.8022527694702148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,2,power_law_1.2,0.7896959781646729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,2,power_law_1.2,0.8216192245483398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,256,balanced,0.17463467518488565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,256,balanced,0.17493333419164023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,256,power_law_1.01,0.17331199645996093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,256,power_law_1.01,0.17412480115890502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,256,power_law_1.2,0.17574399709701538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,256,power_law_1.2,0.1759935975074768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,32,balanced,0.2062079906463623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,32,balanced,0.2068586746851603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,32,power_law_1.01,0.1981951951980591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,32,power_law_1.01,0.2022655963897705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,32,power_law_1.2,0.20315520763397216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,32,power_law_1.2,0.20858240127563477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,4,balanced,0.5262506802876791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,4,balanced,0.5267626841862997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,4,power_law_1.01,0.47736320495605467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,4,power_law_1.01,0.5033279895782471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,4,power_law_1.2,0.5029439926147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,4,power_law_1.2,0.5083392143249512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,64,balanced,0.18120533227920532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,64,balanced,0.18301333983739218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,64,power_law_1.01,0.17994879484176635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,64,power_law_1.01,0.18008960485458375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,64,power_law_1.2,0.18056960105895997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,64,power_law_1.2,0.18268799781799316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,8,balanced,0.3545973300933838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,8,balanced,0.35523200035095215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,8,power_law_1.01,0.33355519771575926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,8,power_law_1.01,0.3483776092529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,8,power_law_1.2,0.33780479431152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,1,8,power_law_1.2,0.3478656053543091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,16,1,balanced,0.25538132588068646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,16,1,balanced,0.25625600417455036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,16,1,power_law_1.01,0.23121280670166017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,16,1,power_law_1.01,0.24138240814208983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,16,1,power_law_1.2,0.24416000843048097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,16,1,power_law_1.2,0.24600319862365722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,2,1,balanced,0.8319466908772787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,2,1,balanced,0.8392586708068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,2,1,power_law_1.01,0.7392191886901855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,2,1,power_law_1.01,0.7529727935791015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,2,1,power_law_1.2,0.7452032089233398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,2,1,power_law_1.2,0.7638144016265869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,32,1,balanced,0.2124639948209127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,32,1,balanced,0.21381866931915283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,32,1,power_law_1.01,0.2026815891265869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,32,1,power_law_1.01,0.20355839729309083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,32,1,power_law_1.2,0.20492799282073976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,32,1,power_law_1.2,0.20519680976867677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,4,1,balanced,0.48340801397959393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,4,1,balanced,0.48393066724141437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,4,1,power_law_1.01,0.4444096088409424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,4,1,power_law_1.01,0.4472320079803467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,4,1,power_law_1.2,0.4478784084320068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,4,1,power_law_1.2,0.45124478340148927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,8,1,balanced,0.32810133695602417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,8,1,balanced,0.3282453417778015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,8,1,power_law_1.01,0.2914432048797607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,8,1,power_law_1.01,0.30478720664978026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,8,1,power_law_1.2,0.3088896036148071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2048,8,256,8,1,power_law_1.2,0.3111743927001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,1,balanced,1.2401706377665203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,1,balanced,1.2489653428395588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,1,power_law_1.01,1.1790271759033204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,1,power_law_1.01,1.187110424041748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,1,power_law_1.2,1.230131244659424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,1,power_law_1.2,1.2328127861022948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,16,balanced,0.218560000260671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,16,balanced,0.21978133916854858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,16,power_law_1.01,0.21910400390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,16,power_law_1.01,0.2202687978744507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,16,power_law_1.2,0.21875200271606446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,16,power_law_1.2,0.21986560821533202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,2,balanced,0.6949919859568278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,2,balanced,0.6964106559753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,2,power_law_1.01,0.6761919975280761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,2,power_law_1.01,0.6816319942474365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,2,power_law_1.2,0.6779903888702392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,2,power_law_1.2,0.6932735919952393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,32,balanced,0.1632373332977295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,32,balanced,0.16331733266512552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,32,power_law_1.01,0.16913919448852538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,32,power_law_1.01,0.1695296049118042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,32,power_law_1.2,0.17240959405899048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,32,power_law_1.2,0.17537920475006102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,4,balanced,0.42264000574747723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,4,balanced,0.423583984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,4,power_law_1.01,0.4113152027130127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,4,power_law_1.01,0.41390080451965333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,4,power_law_1.2,0.40801281929016114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,4,power_law_1.2,0.4116223812103271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,8,balanced,0.28568534056345624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,8,balanced,0.28596266110738117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,8,power_law_1.01,0.28694400787353513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,8,power_law_1.01,0.2874687910079956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,8,power_law_1.2,0.29243519306182864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,1,8,power_law_1.2,0.2948607921600342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,16,1,balanced,0.2115573287010193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,16,1,balanced,0.2134986718495687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,16,1,power_law_1.01,0.21018240451812745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,16,1,power_law_1.01,0.2109055995941162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,16,1,power_law_1.2,0.21128320693969727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,16,1,power_law_1.2,0.2126528024673462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,2,1,balanced,0.6684373219807943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,2,1,balanced,0.6712586879730225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,2,1,power_law_1.01,0.6426688194274902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,2,1,power_law_1.01,0.6430848121643067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,2,1,power_law_1.2,0.6499839782714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,2,1,power_law_1.2,0.6557375907897949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,32,1,balanced,0.1687999963760376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,32,1,balanced,0.1692906618118286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,32,1,power_law_1.01,0.1677183985710144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,32,1,power_law_1.01,0.1679360032081604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,32,1,power_law_1.2,0.1687872052192688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,32,1,power_law_1.2,0.16967040300369263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,4,1,balanced,0.3840693235397339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,4,1,balanced,0.3864159981409709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,4,1,power_law_1.01,0.3730751991271973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,4,1,power_law_1.01,0.3763008117675781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,4,1,power_law_1.2,0.37816319465637205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,4,1,power_law_1.2,0.38005120754241944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,8,1,balanced,0.24945066372553507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,8,1,balanced,0.24996799230575562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,8,1,power_law_1.01,0.2456127882003784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,8,1,power_law_1.01,0.24694399833679198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,8,1,power_law_1.2,0.2475071907043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,6144,2560,8,160,8,1,power_law_1.2,0.24926719665527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,1,balanced,1.881440003712972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,1,balanced,1.8899466196695964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,1,power_law_1.01,1.606015968322754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,1,power_law_1.01,1.6491327285766602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,1,power_law_1.2,1.626540756225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,1,power_law_1.2,1.652992057800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,128,balanced,0.1953386664390564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,128,balanced,0.1954453388849894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,128,power_law_1.01,0.1931071996688843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,128,power_law_1.01,0.19331200122833253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,128,power_law_1.2,0.19392640590667726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,128,power_law_1.2,0.195360004901886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,16,balanced,0.3015893300374349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,16,balanced,0.30426667133967084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,16,power_law_1.01,0.2842303991317749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,16,power_law_1.01,0.28691840171813965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,16,power_law_1.2,0.2907007932662964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,16,power_law_1.2,0.29489281177520754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,2,balanced,1.012495994567871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,2,balanced,1.0131573677062988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,2,power_law_1.01,0.9141119956970215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,2,power_law_1.01,0.9165632247924804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,2,power_law_1.2,0.9186559677124023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,2,power_law_1.2,0.9466752052307129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,256,balanced,0.19113065799077353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,256,balanced,0.19303999344507852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,256,power_law_1.01,0.1895359992980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,256,power_law_1.01,0.18997119665145873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,256,power_law_1.2,0.19187840223312377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,256,power_law_1.2,0.19234559535980225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,32,balanced,0.23214399814605713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,32,balanced,0.23325333992640176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,32,power_law_1.01,0.22085120677947997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,32,power_law_1.01,0.22584319114685059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,32,power_law_1.2,0.2263808012008667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,32,power_law_1.2,0.22814719676971434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,4,balanced,0.6017813285191854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,4,balanced,0.6032266616821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,4,power_law_1.01,0.5504320144653321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,4,power_law_1.01,0.5642240047454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,4,power_law_1.2,0.5635327816009521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,4,power_law_1.2,0.5713856220245361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,64,balanced,0.19777599970499674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,64,balanced,0.19925866524378458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,64,power_law_1.01,0.19717760086059571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,64,power_law_1.01,0.19883519411087036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,64,power_law_1.2,0.20103681087493896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,64,power_law_1.2,0.20151679515838622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,8,balanced,0.401093324025472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,8,balanced,0.40405865510304767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,8,power_law_1.01,0.38087680339813235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,8,power_law_1.01,0.3860543966293335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,8,power_law_1.2,0.3829823970794678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,1,8,power_law_1.2,0.3887295961380005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,16,1,balanced,0.29335999488830566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,16,1,balanced,0.2956586678822835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,16,1,power_law_1.01,0.26472959518432615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,16,1,power_law_1.01,0.27650558948516846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,16,1,power_law_1.2,0.276857590675354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,16,1,power_law_1.2,0.28336000442504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,2,1,balanced,0.9635626475016276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,2,1,balanced,0.9726400375366211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,2,1,power_law_1.01,0.8397631645202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,2,1,power_law_1.01,0.8785280227661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,2,1,power_law_1.2,0.8635456085205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,2,1,power_law_1.2,0.8921855926513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,32,1,balanced,0.24408000707626343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,32,1,balanced,0.24478934208552042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,32,1,power_law_1.01,0.23169279098510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,32,1,power_law_1.01,0.23180160522460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,32,1,power_law_1.2,0.23585920333862304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,32,1,power_law_1.2,0.23610880374908447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,4,1,balanced,0.5579893191655477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,4,1,balanced,0.5615573326746622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,4,1,power_law_1.01,0.500819206237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,4,1,power_law_1.01,0.5043456077575683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,4,1,power_law_1.2,0.5128191947937012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,4,1,power_law_1.2,0.5247231960296631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,8,1,balanced,0.38045867284138996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,8,1,balanced,0.38093332449595135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,8,1,power_law_1.01,0.34613120555877686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,8,1,power_law_1.01,0.3489599943161011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,8,1,power_law_1.2,0.35992960929870604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,256,8,1,power_law_1.2,0.3608128070831299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,1,balanced,2.795776049296061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,1,balanced,2.8232107162475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,1,power_law_1.01,2.244588851928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,1,power_law_1.01,2.2534912109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,1,power_law_1.2,2.1793344497680662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,1,power_law_1.2,2.2253887176513674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,128,balanced,0.25251199801762897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,128,balanced,0.25282132625579834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,128,power_law_1.01,0.24952960014343262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,128,power_law_1.01,0.2502016067504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,128,power_law_1.2,0.2493504047393799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,128,power_law_1.2,0.24978559017181395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,16,balanced,0.39908798535664874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,16,balanced,0.399397333463033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,16,power_law_1.01,0.3757888078689575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,16,power_law_1.01,0.37655038833618165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,16,power_law_1.2,0.3737152099609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,16,power_law_1.2,0.3919872045516968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,2,balanced,1.4741172790527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,2,balanced,1.5118613243103027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,2,power_law_1.01,1.2543231964111328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,2,power_law_1.01,1.2605183601379395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,2,power_law_1.2,1.2232128143310548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,2,power_law_1.2,1.2393024444580079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,32,balanced,0.318938672542572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,32,balanced,0.31935999790827435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,32,power_law_1.01,0.2960319995880127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,32,power_law_1.01,0.30227200984954833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,32,power_law_1.2,0.3041984081268311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,32,power_law_1.2,0.3147072076797485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,4,balanced,0.8634293079376221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,4,balanced,0.8635573387145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,4,power_law_1.01,0.7351679801940918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,4,power_law_1.01,0.7784704208374024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,4,power_law_1.2,0.7396671772003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,4,power_law_1.2,0.7910848140716553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,64,balanced,0.2674293319384257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,64,balanced,0.2691253423690796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,64,power_law_1.01,0.26134400367736815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,64,power_law_1.01,0.26375041007995603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,64,power_law_1.2,0.26293120384216306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,64,power_law_1.2,0.26320641040802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,8,balanced,0.5560213327407837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,8,balanced,0.5599626700083414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,8,power_law_1.01,0.4987775802612305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,8,power_law_1.01,0.5007232189178467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,8,power_law_1.2,0.526361608505249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,1,8,power_law_1.2,0.5327040195465088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,16,1,balanced,0.38607998689015705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,16,1,balanced,0.38648001352945965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,16,1,power_law_1.01,0.3541696071624756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,16,1,power_law_1.01,0.3547136068344116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,16,1,power_law_1.2,0.3538496017456055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,16,1,power_law_1.2,0.3539200067520142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,2,1,balanced,1.400261402130127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,2,1,balanced,1.4195094108581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,2,1,power_law_1.01,1.164844799041748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,2,1,power_law_1.01,1.1713919639587402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,2,1,power_law_1.2,1.165004825592041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,2,1,power_law_1.2,1.1666048049926758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,32,1,balanced,0.33244266112645465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,32,1,balanced,0.332479993502299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,32,1,power_law_1.01,0.3010688066482544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,32,1,power_law_1.01,0.30180480480194094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,32,1,power_law_1.2,0.3010240077972412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,32,1,power_law_1.2,0.30230400562286375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,4,1,balanced,0.7962026596069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,4,1,balanced,0.7977706591288248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,4,1,power_law_1.01,0.6825344085693359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,4,1,power_law_1.01,0.6872000217437744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,4,1,power_law_1.2,0.6727424144744873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,4,1,power_law_1.2,0.6820735931396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,8,1,balanced,0.524885336558024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,8,1,balanced,0.5262773434321085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,8,1,power_law_1.01,0.4474624156951904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,8,1,power_law_1.01,0.45462398529052733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,8,1,power_law_1.2,0.44896640777587893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,320,7168,2048,8,384,8,1,power_law_1.2,0.4523712158203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,1,balanced,0.1570186714331309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,1,balanced,0.1574079990386963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,1,power_law_1.01,0.15805439949035643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,1,power_law_1.01,0.1592960000038147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,1,power_law_1.2,0.15983999967575074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,1,power_law_1.2,0.16054400205612182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,128,balanced,0.06229866544405619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,128,balanced,0.0624533345301946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,128,power_law_1.01,0.06085759997367859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,128,power_law_1.01,0.06165120005607605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,128,power_law_1.2,0.06099200248718262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,128,power_law_1.2,0.06146559715270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,16,balanced,0.06229866544405619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,16,balanced,0.06369600196679433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,16,power_law_1.01,0.06350079774856568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,16,power_law_1.01,0.06427519917488098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,16,power_law_1.2,0.06343680024147033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,16,power_law_1.2,0.06409599781036376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,2,balanced,0.11129599809646606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,2,balanced,0.11251733700434367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,2,power_law_1.01,0.11388800144195557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,2,power_law_1.01,0.11649919748306274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,2,power_law_1.2,0.11641600131988525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,2,power_law_1.2,0.11758719682693482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,32,balanced,0.062208001812299095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,32,balanced,0.06228266656398773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,32,power_law_1.01,0.06109439730644226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,32,power_law_1.01,0.06152960062026978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,32,power_law_1.2,0.06231039762496948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,32,power_law_1.2,0.06233599781990051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,4,balanced,0.08884800473848979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,4,balanced,0.0897759993871053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,4,power_law_1.01,0.09128320217132568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,4,power_law_1.01,0.0914687991142273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,4,power_law_1.2,0.09201279878616334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,4,power_law_1.2,0.0921280026435852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,64,balanced,0.06224533418814341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,64,balanced,0.06238933404286703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,64,power_law_1.01,0.06154239773750305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,64,power_law_1.01,0.061561602354049685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,64,power_law_1.2,0.0617792010307312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,64,power_law_1.2,0.061843198537826535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,8,balanced,0.07098133365313213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,8,balanced,0.07215466598669688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,8,power_law_1.01,0.07249280214309692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,8,power_law_1.01,0.0729088008403778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,8,power_law_1.2,0.0737600028514862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,1,8,power_law_1.2,0.07511039972305297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,2,1,balanced,0.10619733730951945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,2,1,balanced,0.10667733351389568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,2,1,power_law_1.01,0.10577919483184814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,2,1,power_law_1.01,0.10611200332641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,2,1,power_law_1.2,0.1090880036354065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,2,1,power_law_1.2,0.11301120519638061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,4,1,balanced,0.08396800359090169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,4,1,balanced,0.08489599823951721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,4,1,power_law_1.01,0.08417919874191285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,4,1,power_law_1.01,0.08437119722366333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,4,1,power_law_1.2,0.08517119884490967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2048,768,8,128,4,1,power_law_1.2,0.08774399757385254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,1,balanced,0.37318400541941327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,1,balanced,0.37332268555959064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,1,power_law_1.01,0.36367359161376955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,1,power_law_1.01,0.365011191368103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,1,power_law_1.2,0.36307199001312257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,1,power_law_1.2,0.36906239986419676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,128,balanced,0.08240533371766408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,128,balanced,0.08273066580295563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,128,power_law_1.01,0.08181120157241821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,128,power_law_1.01,0.08227840065956116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,128,power_law_1.2,0.08298239707946778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,128,power_law_1.2,0.08304640054702758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,16,balanced,0.09517866373062134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,16,balanced,0.09547199805577596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,16,power_law_1.01,0.09548159837722778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,16,power_law_1.01,0.09699199795722961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,16,power_law_1.2,0.09756159782409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,16,power_law_1.2,0.09961599707603455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,2,balanced,0.2367466688156128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,2,balanced,0.23914132515589395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,2,power_law_1.01,0.2286463975906372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,2,power_law_1.01,0.22875521183013917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,2,power_law_1.2,0.22481920719146728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,2,power_law_1.2,0.2310336112976074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,32,balanced,0.08685333530108134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,32,balanced,0.08819199601809184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,32,power_law_1.01,0.08865919709205627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,32,power_law_1.01,0.08891519904136658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,32,power_law_1.2,0.088646399974823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,32,power_law_1.2,0.09052799940109253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,4,balanced,0.16265066464742026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,4,balanced,0.16268266240755716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,4,power_law_1.01,0.15576319694519042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,4,power_law_1.01,0.15803519487380982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,4,power_law_1.2,0.15838719606399537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,4,power_law_1.2,0.1597440004348755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,64,balanced,0.08318933347860973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,64,balanced,0.08478933572769165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,64,power_law_1.01,0.08316799998283386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,64,power_law_1.01,0.0840448021888733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,64,power_law_1.2,0.08368639945983887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,64,power_law_1.2,0.08483840227127075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,8,balanced,0.1237333317597707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,8,balanced,0.12432533502578735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,8,power_law_1.01,0.12166399955749511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,8,power_law_1.01,0.12188800573348998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,8,power_law_1.2,0.12279679775238037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,1,8,power_law_1.2,0.12457599639892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,16,1,balanced,0.3325653274854024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,16,1,balanced,0.335749348004659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,16,1,power_law_1.01,0.3357631921768188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,16,1,power_law_1.01,0.3375296115875244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,16,1,power_law_1.2,0.34734721183776857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,16,1,power_law_1.2,0.34829440116882326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,2,1,balanced,0.2232266664505005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,2,1,balanced,0.22409067551294962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,2,1,power_law_1.01,0.21330559253692627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,2,1,power_law_1.01,0.21543679237365723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,2,1,power_law_1.2,0.21714560985565184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,2,1,power_law_1.2,0.21957759857177733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,32,1,balanced,0.29711467027664185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,32,1,balanced,0.29763732353846234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,32,1,power_law_1.01,0.3000511884689331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,32,1,power_law_1.01,0.300927996635437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,32,1,power_law_1.2,0.31040000915527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,32,1,power_law_1.2,0.31512320041656494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,4,1,balanced,0.14684266845385233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,4,1,balanced,0.14699199795722961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,4,1,power_law_1.01,0.14260480403900147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,4,1,power_law_1.01,0.14296319484710693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,4,1,power_law_1.2,0.1437440037727356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,4,1,power_law_1.2,0.14543999433517457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,8,1,balanced,0.43397335211435956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,8,1,balanced,0.43483734130859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,8,1,power_law_1.01,0.43903360366821287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,8,1,power_law_1.01,0.43967361450195314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,8,1,power_law_1.2,0.4512063980102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,2688,1856,6,128,8,1,power_law_1.2,0.45331201553344724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,1,balanced,0.6223839918772379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,1,balanced,0.6238666772842407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,1,power_law_1.01,0.5566592216491699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,1,power_law_1.01,0.5673279762268066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,1,power_law_1.2,0.574073600769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,1,power_law_1.2,0.5774784088134766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,128,balanced,0.11736533045768738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,128,balanced,0.11797866225242615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,128,power_law_1.01,0.11663999557495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,128,power_law_1.01,0.11701120138168335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,128,power_law_1.2,0.11739519834518433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,128,power_law_1.2,0.11754879951477051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,16,balanced,0.15292267004648843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,16,balanced,0.15389333168665567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,16,power_law_1.01,0.1472640037536621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,16,power_law_1.01,0.1478271961212158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,16,power_law_1.2,0.14895999431610107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,16,power_law_1.2,0.1505344033241272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,2,balanced,0.3829333384831746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,2,balanced,0.3832906484603882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,2,power_law_1.01,0.3514111995697021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,2,power_law_1.01,0.35425920486450196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,2,power_law_1.2,0.3503360033035278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,2,power_law_1.2,0.35599360466003416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,256,balanced,0.11555733283360799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,256,balanced,0.11726400256156921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,256,power_law_1.01,0.11585279703140258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,256,power_law_1.01,0.11615359783172607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,256,power_law_1.2,0.11608320474624634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,256,power_law_1.2,0.1162559986114502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,32,balanced,0.12826133767763773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,32,balanced,0.12934933106104532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,32,power_law_1.01,0.12752000093460084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,32,power_law_1.01,0.12776960134506227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,32,power_law_1.2,0.12946560382843017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,32,power_law_1.2,0.12975360155105592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,4,balanced,0.25340267022450763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,4,balanced,0.2537333369255066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,4,power_law_1.01,0.24289920330047607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,4,power_law_1.01,0.2459968090057373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,4,power_law_1.2,0.23955199718475342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,4,power_law_1.2,0.24257919788360596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,64,balanced,0.11959999799728394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,64,balanced,0.12175466616948445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,64,power_law_1.01,0.12081279754638671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,64,power_law_1.01,0.1210752010345459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,64,power_law_1.2,0.12149120569229126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,64,power_law_1.2,0.12195839881896972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,8,balanced,0.18474133809407553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,8,balanced,0.18668266137441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,8,power_law_1.01,0.17731200456619262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,8,power_law_1.01,0.17842559814453124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,8,power_law_1.2,0.18218239545822143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,1,8,power_law_1.2,0.1823232054710388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,16,1,balanced,0.14366933703422546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,16,1,balanced,0.1439413328965505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,16,1,power_law_1.01,0.1343808054924011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,16,1,power_law_1.01,0.13549439907073973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,16,1,power_law_1.2,0.14013439416885376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,16,1,power_law_1.2,0.14046080112457277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,2,1,balanced,0.35436801115671795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,2,1,balanced,0.35541868209838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,2,1,power_law_1.01,0.3256959915161133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,2,1,power_law_1.01,0.32805120944976807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,2,1,power_law_1.2,0.3285376071929932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,2,1,power_law_1.2,0.334553599357605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,32,1,balanced,0.1237333317597707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,32,1,balanced,0.12570133805274963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,32,1,power_law_1.01,0.11699199676513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,32,1,power_law_1.01,0.11722240447998047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,32,1,power_law_1.2,0.12024960517883301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,32,1,power_law_1.2,0.12030080556869507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,4,1,balanced,0.22763733069101968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,4,1,balanced,0.22835199038187662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,4,1,power_law_1.01,0.2111423969268799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,4,1,power_law_1.01,0.2129983901977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,4,1,power_law_1.2,0.21647360324859619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,4,1,power_law_1.2,0.21863679885864257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,8,1,balanced,0.1681493322054545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,8,1,balanced,0.16879467169443765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,8,1,power_law_1.01,0.15750399827957154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,8,1,power_law_1.01,0.15902719497680665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,8,1,power_law_1.2,0.1602560043334961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,3072,1536,8,256,8,1,power_law_1.2,0.16273280382156372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,1,balanced,0.4259093205134074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,1,balanced,0.42614932854970294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,1,power_law_1.01,0.4710527896881104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,1,power_law_1.01,0.47555837631225584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,1,power_law_1.2,0.46976637840270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,1,power_law_1.2,0.4786240100860596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,2,balanced,0.26344533761342365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,2,balanced,0.26449066400527954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,2,power_law_1.01,0.3118272066116333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,2,power_law_1.01,0.3146559953689575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,2,power_law_1.2,0.3117439985275269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,2,power_law_1.2,0.3292288064956665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,4,balanced,0.2098133365313212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,4,balanced,0.21031999588012695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,4,power_law_1.01,0.24081919193267823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,4,power_law_1.01,0.2445823907852173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,4,power_law_1.2,0.23420801162719726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,4,power_law_1.2,0.23601279258728028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,8,balanced,0.18327999114990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,8,balanced,0.18704533576965332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,8,power_law_1.01,0.2111743927001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,8,power_law_1.01,0.2151360034942627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,8,power_law_1.2,0.2133120059967041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,1,8,power_law_1.2,0.2141632080078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,16,1,balanced,0.0678719977537791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,16,1,balanced,0.07450133562088013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,16,1,power_law_1.01,0.07311360239982605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,16,1,power_law_1.01,0.07395200133323669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,16,1,power_law_1.2,0.07290239930152893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,16,1,power_law_1.2,0.07445759773254394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,2,1,balanced,0.23878933986028036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,2,1,balanced,0.23909332354863486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,2,1,power_law_1.01,0.245580792427063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,2,1,power_law_1.01,0.24904320240020753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,2,1,power_law_1.2,0.24707200527191162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,2,1,power_law_1.2,0.24896640777587892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,32,1,balanced,0.05482133229573568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,32,1,balanced,0.056133334835370384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,32,1,power_law_1.01,0.052172797918319705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,32,1,power_law_1.01,0.05273600220680237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,32,1,power_law_1.2,0.05361279845237732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,32,1,power_law_1.2,0.05910400152206421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,4,1,balanced,0.146314670642217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,4,1,balanced,0.14847999811172485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,4,1,power_law_1.01,0.14534399509429932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,4,1,power_law_1.01,0.14796799421310425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,4,1,power_law_1.2,0.14620159864425658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,4,1,power_law_1.2,0.14856319427490233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,8,1,balanced,0.10250666737556458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,8,1,balanced,0.10261866450309753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,8,1,power_law_1.01,0.09836159944534302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,8,1,power_law_1.01,0.10051840543746948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,8,1,power_law_1.2,0.10020480155944825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,14336,2,8,8,1,power_law_1.2,0.10289280414581299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,1,balanced,0.44460801283518475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,1,balanced,0.4480373462041219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,1,power_law_1.01,0.4386303901672363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,1,power_law_1.01,0.4517695903778076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,1,power_law_1.2,0.45664639472961427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,1,power_law_1.2,0.45703678131103515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,128,balanced,0.09745599826176961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,128,balanced,0.09770133097966512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,128,power_law_1.01,0.09796479940414429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,128,power_law_1.01,0.09826560020446777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,128,power_law_1.2,0.09809280037879944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,128,power_law_1.2,0.0987775981426239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,16,balanced,0.11134399970372517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,16,balanced,0.1136799951394399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,16,power_law_1.01,0.11658240556716919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,16,power_law_1.01,0.12159359455108643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,16,power_law_1.2,0.11994240283966065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,16,power_law_1.2,0.1212224006652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,2,balanced,0.2785173257191976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,2,balanced,0.2808213432629903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,2,power_law_1.01,0.2809344053268433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,2,power_law_1.01,0.2894335985183716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,2,power_law_1.2,0.2868671894073486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,2,power_law_1.2,0.2915328025817871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,32,balanced,0.1032533347606659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,32,power_law_1.01,0.10506880283355713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,32,power_law_1.01,0.10572160482406616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,32,power_law_1.2,0.10734720230102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,32,power_law_1.2,0.10768640041351318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,4,balanced,0.18822934230168661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,4,balanced,0.19075200955073038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,4,power_law_1.01,0.19541759490966798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,4,power_law_1.01,0.1962815999984741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,4,power_law_1.2,0.1929919958114624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,4,power_law_1.2,0.19896320104599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,64,balanced,0.09925867120424907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,64,balanced,0.1011253297328949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,64,power_law_1.01,0.10151679515838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,64,power_law_1.01,0.10152319669723511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,64,power_law_1.2,0.10165120363235473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,64,power_law_1.2,0.1032639980316162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,8,balanced,0.1450933317343394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,8,balanced,0.14591466387112936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,8,power_law_1.01,0.14885120391845702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,8,power_law_1.01,0.14960639476776122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,8,power_law_1.2,0.14814720153808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,1,8,power_law_1.2,0.14974720478057862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,16,1,balanced,0.11555199821790059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,16,1,balanced,0.11566399534543355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,16,1,power_law_1.01,0.11553280353546143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,16,1,power_law_1.01,0.11624319553375244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,16,1,power_law_1.2,0.11675519943237304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,16,1,power_law_1.2,0.11690239906311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,2,1,balanced,0.2635626594225566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,2,1,balanced,0.2659839987754822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,2,1,power_law_1.01,0.2624703884124756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,2,1,power_law_1.01,0.26363520622253417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,2,1,power_law_1.2,0.2671231985092163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,2,1,power_law_1.2,0.26715519428253176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,32,1,balanced,0.10533866286277771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,32,1,balanced,0.1062506635983785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,32,1,power_law_1.01,0.10680320262908935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,32,1,power_law_1.01,0.10714880228042603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,32,1,power_law_1.2,0.10840320587158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,32,1,power_law_1.2,0.10887680053710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,4,1,balanced,0.17339199781417847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,4,1,balanced,0.17511999607086182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,4,1,power_law_1.01,0.17179520130157472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,4,1,power_law_1.01,0.17184000015258788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,4,1,power_law_1.2,0.1804159998893738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,4,1,power_law_1.2,0.18099839687347413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,8,1,balanced,0.13175466656684875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,8,1,balanced,0.13216533263524374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,8,1,power_law_1.01,0.13343360424041747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,8,1,power_law_1.01,0.13388799428939818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,8,1,power_law_1.2,0.1451647996902466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,1536,8,128,8,1,power_law_1.2,0.14545279741287231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,1,balanced,2.844282786051432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,1,balanced,2.8913065592447915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,1,power_law_1.01,2.6461055755615233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,1,power_law_1.01,2.652288055419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,1,power_law_1.2,2.7517696380615235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,1,power_law_1.2,2.7635135650634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,128,balanced,0.3693813482920329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,128,balanced,0.36977068583170575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,128,power_law_1.01,0.3711872100830078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,128,power_law_1.01,0.37128961086273193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,128,power_law_1.2,0.3740799903869629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,128,power_law_1.2,0.3775615930557251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,16,balanced,0.5264319976170858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,16,balanced,0.527946670850118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,16,power_law_1.01,0.5167871952056885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,16,power_law_1.01,0.5196224212646484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,16,power_law_1.2,0.5200191974639893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,16,power_law_1.2,0.5264768123626709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,2,balanced,1.5840373039245605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,2,balanced,1.6063040097554524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,2,power_law_1.01,1.5107647895812988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,2,power_law_1.01,1.5249343872070313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,2,power_law_1.2,1.544870376586914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,2,power_law_1.2,1.5617792129516601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,256,balanced,0.3631253242492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,256,balanced,0.3638399839401245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,256,power_law_1.01,0.36471679210662844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,256,power_law_1.01,0.36516480445861815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,256,power_law_1.2,0.36463360786437987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,256,power_law_1.2,0.3666815996170044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,32,balanced,0.437173326810201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,32,balanced,0.44064001242319745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,32,power_law_1.01,0.4344319820404053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,32,power_law_1.01,0.4389823913574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,32,power_law_1.2,0.44185600280761717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,32,power_law_1.2,0.4451200008392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,4,balanced,0.9792053699493408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,4,balanced,0.9832746982574463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,4,power_law_1.01,0.9465727806091309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,4,power_law_1.01,0.9503104209899902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,4,power_law_1.2,0.975436782836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,4,power_law_1.2,0.9771840095520019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,64,balanced,0.3893119891484578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,64,balanced,0.38947200775146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,64,power_law_1.01,0.39378559589385986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,64,power_law_1.01,0.3989120006561279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,64,power_law_1.2,0.4026303768157959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,64,power_law_1.2,0.404691219329834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,8,balanced,0.6793920199076334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,8,balanced,0.6795573234558105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,8,power_law_1.01,0.660697603225708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,8,power_law_1.01,0.6649407863616943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,8,power_law_1.2,0.6769472122192383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,1,8,power_law_1.2,0.6825791835784912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,16,1,balanced,2.3288373947143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,16,1,balanced,2.3317386309305825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,16,1,power_law_1.01,2.294758415222168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,16,1,power_law_1.01,2.3027263641357423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,16,1,power_law_1.2,2.391993522644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,16,1,power_law_1.2,2.3956735610961912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,2,1,balanced,1.4801759719848633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,2,1,balanced,1.5142985979715984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,2,1,power_law_1.01,1.3663423538208008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,2,1,power_law_1.01,1.3812735557556153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,2,1,power_law_1.2,1.4289919853210449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,2,1,power_law_1.2,1.4420096397399902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,32,1,balanced,1.8103893597920735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,32,1,balanced,1.811903953552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,32,1,power_law_1.01,1.784979248046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,32,1,power_law_1.01,1.8089471817016602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,32,1,power_law_1.2,1.853241539001465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,32,1,power_law_1.2,1.8799999237060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,4,1,balanced,0.839792013168335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,4,1,balanced,0.8419146537780762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,4,1,power_law_1.01,0.805081558227539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,4,1,power_law_1.01,0.8088512420654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,4,1,power_law_1.2,0.8325695991516113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,4,1,power_law_1.2,0.833407974243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,8,1,balanced,0.5335253477096558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,8,1,balanced,0.5335946480433146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,8,1,power_law_1.01,0.5159423828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,8,1,power_law_1.01,0.5162303924560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,8,1,power_law_1.2,0.5360896110534668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,4096,2688,22,512,8,1,power_law_1.2,0.537497615814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,1,balanced,0.6887040138244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,1,balanced,0.6942613124847412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,1,power_law_1.01,0.7064064025878907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,1,power_law_1.01,0.724076795578003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,1,power_law_1.2,0.7116608142852783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,1,power_law_1.2,0.7271615982055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,2,balanced,0.4006719986597697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,2,balanced,0.40724798043568927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,2,power_law_1.01,0.47687039375305174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,2,power_law_1.01,0.49752321243286135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,2,power_law_1.2,0.5127359867095947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,2,power_law_1.2,0.5200960159301757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,4,balanced,0.2696053385734558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,4,balanced,0.27194666862487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,4,power_law_1.01,0.3038784027099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,4,power_law_1.01,0.30668799877166747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,4,power_law_1.2,0.3203775882720947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,4,power_law_1.2,0.321996808052063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,8,balanced,0.22523732980092367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,8,balanced,0.23214399814605713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,8,power_law_1.01,0.2630592107772827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,8,power_law_1.01,0.26502399444580077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,8,power_law_1.2,0.2641535997390747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,1,8,power_law_1.2,0.26771841049194334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,16,1,balanced,0.09424533446629842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,16,1,balanced,0.09708799918492635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,16,1,power_law_1.01,0.09299200177192687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,16,1,power_law_1.01,0.09304320216178893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,16,1,power_law_1.2,0.09299839735031128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,16,1,power_law_1.2,0.09319040179252625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,2,1,balanced,0.3468053340911865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,2,1,balanced,0.3472586472829183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,2,1,power_law_1.01,0.352345609664917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,2,1,power_law_1.01,0.36129920482635497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,2,1,power_law_1.2,0.35262720584869384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,2,1,power_law_1.2,0.3650304079055786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,32,1,balanced,0.08298666775226593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,32,1,balanced,0.08378133177757263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,32,1,power_law_1.01,0.0812287986278534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,32,1,power_law_1.01,0.08218240141868591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,32,1,power_law_1.2,0.08079360127449035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,32,1,power_law_1.2,0.08144639730453491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,4,1,balanced,0.20256533225377402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,4,1,balanced,0.20481600364049277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,4,1,power_law_1.01,0.20426878929138184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,4,1,power_law_1.01,0.20510079860687255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,4,1,power_law_1.2,0.20307838916778564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,4,1,power_law_1.2,0.20609281063079835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,8,1,balanced,0.13597333431243896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,8,1,balanced,0.13974933822949728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,8,1,power_law_1.01,0.134278404712677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,8,1,power_law_1.01,0.13671679496765138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,8,1,power_law_1.2,0.13393280506134034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,16384,2,8,8,1,power_law_1.2,0.13730560541152953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,1,balanced,1.6183679898579915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,1,balanced,1.6325546900431316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,1,power_law_1.01,1.4356032371520997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,1,power_law_1.01,1.4483903884887694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,1,power_law_1.2,1.436467170715332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,1,power_law_1.2,1.4654784202575684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,128,balanced,0.1883359948794047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,128,balanced,0.18914133310317993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,128,power_law_1.01,0.1867136001586914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,128,power_law_1.01,0.18681600093841552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,128,power_law_1.2,0.18731520175933838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,128,power_law_1.2,0.18934400081634523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,16,balanced,0.2770826617876689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,16,balanced,0.27722134192784625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,16,power_law_1.01,0.2649280071258545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,16,power_law_1.01,0.2712064027786255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,16,power_law_1.2,0.2705215930938721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,16,power_law_1.2,0.2742784023284912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,2,balanced,0.8904319604237875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,2,balanced,0.8951040108998617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,2,power_law_1.01,0.8052864074707031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,2,power_law_1.01,0.8179967880249024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,2,power_law_1.2,0.8334719657897949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,2,power_law_1.2,0.8390399932861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,256,balanced,0.18487467368443808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,256,balanced,0.18652266263961792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,256,power_law_1.01,0.1841472029685974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,256,power_law_1.01,0.1848512053489685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,256,power_law_1.2,0.184716796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,256,power_law_1.2,0.18551679849624633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,32,balanced,0.2153653303782145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,32,balanced,0.21713600556055704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,32,power_law_1.01,0.20977919101715087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,32,power_law_1.01,0.21412479877471924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,32,power_law_1.2,0.22168319225311278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,32,power_law_1.2,0.2232896089553833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,4,balanced,0.5381066799163818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,4,balanced,0.5393866697947184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,4,power_law_1.01,0.5027135848999024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,4,power_law_1.01,0.5234432220458984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,4,power_law_1.2,0.5037888050079345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,4,power_law_1.2,0.5112639904022217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,64,balanced,0.19114667177200317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,64,balanced,0.19124799966812134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,64,power_law_1.01,0.19000320434570311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,64,power_law_1.01,0.19044480323791504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,64,power_law_1.2,0.1940608024597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,64,power_law_1.2,0.19442559480667115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,8,balanced,0.36556800206502277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,8,balanced,0.3658133347829183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,8,power_law_1.01,0.3465984106063843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,8,power_law_1.01,0.3517888069152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,8,power_law_1.2,0.3493760108947754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,1,8,power_law_1.2,0.35141758918762206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,16,1,balanced,0.262661337852478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,16,1,balanced,0.2627413272857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,16,1,power_law_1.01,0.24712960720062255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,16,1,power_law_1.01,0.24750080108642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,16,1,power_law_1.2,0.25284481048583984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,16,1,power_law_1.2,0.25388801097869873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,2,1,balanced,0.8389493624369303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,2,1,balanced,0.8512053489685059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,2,1,power_law_1.01,0.7542719841003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,2,1,power_law_1.01,0.7585472106933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,2,1,power_law_1.2,0.7800576210021972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,2,1,power_law_1.2,0.7892096042633057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,32,1,balanced,0.2207733392715454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,32,1,balanced,0.22187199195226034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,32,1,power_law_1.01,0.2099839925765991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,32,1,power_law_1.01,0.2114880084991455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,32,1,power_law_1.2,0.21332480907440185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,32,1,power_law_1.2,0.2135999917984009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,4,1,balanced,0.48922133445739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,4,1,balanced,0.48931201299031574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,4,1,power_law_1.01,0.45500798225402833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,4,1,power_law_1.01,0.46528000831604005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,4,1,power_law_1.2,0.4608191967010498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,4,1,power_law_1.2,0.4752255916595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,8,1,balanced,0.3328533371289571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,8,1,balanced,0.33369600772857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,8,1,power_law_1.01,0.31461119651794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,8,1,power_law_1.01,0.315833592414856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,8,1,power_law_1.2,0.31945600509643557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2048,8,256,8,1,power_law_1.2,0.32048640251159666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,1,balanced,1.2640159924825032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,1,balanced,1.2675893306732178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,1,power_law_1.01,1.2125823974609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,1,power_law_1.01,1.224345588684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,1,power_law_1.2,1.246617603302002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,1,power_law_1.2,1.2483200073242187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,16,balanced,0.23047999540964761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,16,balanced,0.23069866498311362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,16,power_law_1.01,0.23066239356994628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,16,power_law_1.01,0.2325376033782959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,16,power_law_1.2,0.23257598876953126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,16,power_law_1.2,0.23554561138153077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,2,balanced,0.7095359961191813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,2,balanced,0.7108906904856364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,2,power_law_1.01,0.6933695793151855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,2,power_law_1.01,0.705625581741333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,2,power_law_1.2,0.7085567951202393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,2,power_law_1.2,0.7188096046447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,32,balanced,0.17264533042907715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,32,balanced,0.17452800273895264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,32,power_law_1.01,0.18545279502868653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,32,power_law_1.01,0.18684799671173097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,32,power_law_1.2,0.196288001537323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,32,power_law_1.2,0.19955840110778808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,4,balanced,0.4358186721801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,4,balanced,0.43587732315063477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,4,power_law_1.01,0.4321599960327148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,4,power_law_1.01,0.437497615814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,4,power_law_1.2,0.4345536231994629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,4,power_law_1.2,0.4450943946838379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,8,balanced,0.2972319920857747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,8,balanced,0.29843733708063763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,8,power_law_1.01,0.29697279930114745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,8,power_law_1.01,0.29799039363861085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,8,power_law_1.2,0.30554239749908446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,1,8,power_law_1.2,0.30737919807434083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,16,1,balanced,0.2188160022099813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,16,1,balanced,0.2192373275756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,16,1,power_law_1.01,0.21583359241485595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,16,1,power_law_1.01,0.2182080030441284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,16,1,power_law_1.2,0.21967360973358155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,16,1,power_law_1.2,0.21980159282684325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,2,1,balanced,0.6781013011932373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,2,1,balanced,0.6815093358357748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,2,1,power_law_1.01,0.6580992221832276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,2,1,power_law_1.01,0.6642623901367187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,2,1,power_law_1.2,0.6704319953918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,2,1,power_law_1.2,0.6705344200134278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,32,1,balanced,0.17266666889190674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,32,1,balanced,0.17492266496022543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,32,1,power_law_1.01,0.17477760314941407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,32,1,power_law_1.01,0.1753216028213501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,32,1,power_law_1.2,0.17621760368347167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,32,1,power_law_1.2,0.1771008014678955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,4,1,balanced,0.3926933209101359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,4,1,balanced,0.3947039842605591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,4,1,power_law_1.01,0.3849792003631592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,4,1,power_law_1.01,0.38904318809509275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,4,1,power_law_1.2,0.38950400352478026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,4,1,power_law_1.2,0.393939208984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,8,1,balanced,0.2569173375765483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,8,1,balanced,0.257146676381429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,8,1,power_law_1.01,0.25487360954284666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,8,1,power_law_1.01,0.25544960498809816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,8,1,power_law_1.2,0.26133759021759034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,6144,2560,8,160,8,1,power_law_1.2,0.26537599563598635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,1,balanced,1.892240047454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,1,balanced,1.8969173431396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,1,power_law_1.01,1.6166656494140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,1,power_law_1.01,1.6211904525756835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,1,power_law_1.2,1.675071907043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,1,power_law_1.2,1.7064512252807618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,128,balanced,0.20586667458216348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,128,balanced,0.20708266894022623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,128,power_law_1.01,0.20499839782714843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,128,power_law_1.01,0.20514559745788574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,128,power_law_1.2,0.20714879035949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,128,power_law_1.2,0.20719358921051026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,16,balanced,0.3126986622810364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,16,balanced,0.31332266330718994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,16,power_law_1.01,0.2957312107086182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,16,power_law_1.01,0.30281600952148435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,16,power_law_1.2,0.3026047945022583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,16,power_law_1.2,0.30353920459747313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,2,balanced,1.025439977645874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,2,balanced,1.025701363881429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,2,power_law_1.01,0.9161536216735839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,2,power_law_1.01,0.918553638458252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,2,power_law_1.2,0.9485119819641114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,2,power_law_1.2,0.9640064239501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,256,balanced,0.20312533775965372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,256,balanced,0.20332266887029013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,256,power_law_1.01,0.20147199630737306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,256,power_law_1.01,0.20258560180664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,256,power_law_1.2,0.20225279331207274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,256,power_law_1.2,0.2023103952407837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,32,balanced,0.24286399284998575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,32,balanced,0.24314665794372559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,32,power_law_1.01,0.2364032030105591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,32,power_law_1.01,0.24033279418945314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,32,power_law_1.2,0.24443519115447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,32,power_law_1.2,0.2454848051071167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,4,balanced,0.6128053267796835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,4,balanced,0.6157439947128296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,4,power_law_1.01,0.5593984127044678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,4,power_law_1.01,0.5761919975280761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,4,power_law_1.2,0.5818816184997558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,4,power_law_1.2,0.5831488132476806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,64,balanced,0.20969067017237344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,64,balanced,0.21036267280578613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,64,power_law_1.01,0.20782079696655273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,64,power_law_1.01,0.20861439704895018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,64,power_law_1.2,0.2150144100189209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,64,power_law_1.2,0.2159424066543579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,8,balanced,0.41330134868621826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,8,balanced,0.4166080156962077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,8,power_law_1.01,0.39468159675598147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,8,power_law_1.01,0.40010881423950195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,8,power_law_1.2,0.3888063907623291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,1,8,power_law_1.2,0.40227198600769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,16,1,balanced,0.3001546661059062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,16,1,balanced,0.301199992497762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,16,1,power_law_1.01,0.2829952001571655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,16,1,power_law_1.01,0.28757760524749754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,16,1,power_law_1.2,0.2925568103790283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,16,1,power_law_1.2,0.2933439970016479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,2,1,balanced,0.9690773487091064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,2,1,balanced,0.975658655166626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,2,1,power_law_1.01,0.8780991554260253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,2,1,power_law_1.01,0.8834495544433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,2,1,power_law_1.2,0.8868032455444336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,2,1,power_law_1.2,0.8897279739379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,32,1,balanced,0.2499786615371704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,32,1,balanced,0.2505173285802205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,32,1,power_law_1.01,0.24090878963470458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,32,1,power_law_1.01,0.24202239513397217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,32,1,power_law_1.2,0.24432001113891602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,32,1,power_law_1.2,0.24463999271392822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,4,1,balanced,0.566271980603536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,4,1,balanced,0.5672213236490885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,4,1,power_law_1.01,0.5262656211853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,4,1,power_law_1.01,0.5327040195465088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,4,1,power_law_1.2,0.5347839832305908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,4,1,power_law_1.2,0.5367680072784424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,8,1,balanced,0.38499200344085693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,8,1,balanced,0.3853439887364705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,8,1,power_law_1.01,0.3574847936630249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,8,1,power_law_1.01,0.36615040302276614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,8,1,power_law_1.2,0.36865279674530027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,256,8,1,power_law_1.2,0.37420799732208254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,1,balanced,2.84004815419515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,1,balanced,2.8999786376953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,1,power_law_1.01,2.252243232727051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,1,power_law_1.01,2.3127296447753904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,1,power_law_1.2,2.2557567596435546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,1,power_law_1.2,2.2719743728637694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,128,balanced,0.26202666759490967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,128,balanced,0.2627413272857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,128,power_law_1.01,0.25931520462036134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,128,power_law_1.01,0.26031999588012694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,128,power_law_1.2,0.26093440055847167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,128,power_law_1.2,0.2617151975631714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,16,balanced,0.4100639820098877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,16,balanced,0.41201066970825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,16,power_law_1.01,0.38442239761352537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,16,power_law_1.01,0.39829120635986326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,16,power_law_1.2,0.3829119920730591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,16,power_law_1.2,0.3885567903518677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,2,balanced,1.4861173629760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,2,balanced,1.5247893333435059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,2,power_law_1.01,1.269542407989502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,2,power_law_1.01,1.3051520347595216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,2,power_law_1.2,1.2700480461120605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,2,power_law_1.2,1.2769920349121093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,32,balanced,0.33022934198379517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,32,balanced,0.33029866218566895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,32,power_law_1.01,0.3147711992263794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,32,power_law_1.01,0.3185728073120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,32,power_law_1.2,0.3104896068572998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,32,power_law_1.2,0.32529919147491454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,4,balanced,0.8759733041127523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,4,balanced,0.8771893183390299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,4,power_law_1.01,0.7632319927215576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,4,power_law_1.01,0.7841472148895263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,4,power_law_1.2,0.7554368019104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,4,power_law_1.2,0.7785024166107177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,64,balanced,0.2791573405265808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,64,balanced,0.27937066555023193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,64,power_law_1.01,0.2714560031890869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,64,power_law_1.01,0.2756351947784424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,64,power_law_1.2,0.27560958862304685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,64,power_law_1.2,0.2785664081573486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,8,balanced,0.5688639879226685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,8,balanced,0.570688009262085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,8,power_law_1.01,0.5247744083404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,8,power_law_1.01,0.5327167987823487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,8,power_law_1.2,0.5045119762420655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,1,8,power_law_1.2,0.5478847980499267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,16,1,balanced,0.39233068625132245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,16,1,balanced,0.39267198244730633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,16,1,power_law_1.01,0.3595648050308228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,16,1,power_law_1.01,0.36104960441589357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,16,1,power_law_1.2,0.3574656009674072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,16,1,power_law_1.2,0.3612799882888794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,2,1,balanced,1.4122613271077473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,2,1,balanced,1.4508959452311199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,2,1,power_law_1.01,1.173964786529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,2,1,power_law_1.01,1.1799936294555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,2,1,power_law_1.2,1.1715007781982423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,2,1,power_law_1.2,1.1834048271179198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,32,1,balanced,0.33824535210927326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,32,1,balanced,0.3386293252309163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,32,1,power_law_1.01,0.308735990524292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,32,1,power_law_1.01,0.3094144105911255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,32,1,power_law_1.2,0.3093247890472412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,32,1,power_law_1.2,0.3113152027130127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,4,1,balanced,0.8047893047332764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,4,1,balanced,0.8065280119578043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,4,1,power_law_1.01,0.6893504142761231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,4,1,power_law_1.01,0.697049617767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,4,1,power_law_1.2,0.6928127765655517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,4,1,power_law_1.2,0.696614408493042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,8,1,balanced,0.5320853392283121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,8,1,balanced,0.5328266620635986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,8,1,power_law_1.01,0.4587264060974121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,8,1,power_law_1.01,0.4624767780303955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,8,1,power_law_1.2,0.46384639739990235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,384,7168,2048,8,384,8,1,power_law_1.2,0.4654975891113281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,1,balanced,0.050944000482559204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,1,balanced,0.05169066786766052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,1,power_law_1.01,0.04871039986610413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,1,power_law_1.01,0.04888960123062134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,1,power_law_1.2,0.046515199542045596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,1,power_law_1.2,0.0468095988035202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,128,balanced,0.02731200059254964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,128,balanced,0.029317334294319153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,128,power_law_1.01,0.026643198728561402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,128,power_law_1.01,0.026745599508285523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,128,power_law_1.2,0.026579201221466064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,128,power_law_1.2,0.026655998826026917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,16,balanced,0.02735999971628189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,16,balanced,0.029194665451844532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,16,power_law_1.01,0.0308351993560791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,16,power_law_1.01,0.03108479976654053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,16,power_law_1.2,0.030752000212669373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,16,power_law_1.2,0.031040000915527343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,2,balanced,0.03826133410135905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,2,balanced,0.041738669077555336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,2,power_law_1.01,0.044582399725914004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,2,power_law_1.01,0.045203199982643126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,2,power_law_1.2,0.04246399998664856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,2,power_law_1.2,0.04371199905872345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,32,balanced,0.027306665976842243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,32,balanced,0.02914133419593175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,32,power_law_1.01,0.02776319980621338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,32,power_law_1.01,0.027923199534416198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,32,power_law_1.2,0.02797439992427826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,32,power_law_1.2,0.02826879918575287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,4,balanced,0.03148799886306127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,4,balanced,0.031957333286603294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,4,power_law_1.01,0.03758080005645752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,4,power_law_1.01,0.037785598635673524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,4,power_law_1.2,0.035743999481201175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,4,power_law_1.2,0.03606399893760681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,64,balanced,0.02743999908367793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,64,balanced,0.029264000554879505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,64,power_law_1.01,0.026617598533630372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,64,power_law_1.01,0.027116799354553224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,64,power_law_1.2,0.027270400524139406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,64,power_law_1.2,0.02736000120639801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,8,balanced,0.02884799987077713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,8,balanced,0.029461334149042766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,8,power_law_1.01,0.03529599905014038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,8,power_law_1.01,0.0357120007276535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,8,power_law_1.2,0.034508800506591795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,1,8,power_law_1.2,0.03470079898834229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,2,1,balanced,0.03214933226505915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,2,1,balanced,0.03350933392842611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,2,1,power_law_1.01,0.03345920145511627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,2,1,power_law_1.01,0.03356159925460815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,2,1,power_law_1.2,0.032646399736404416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,2,1,power_law_1.2,0.03342080116271973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,4,1,balanced,0.02739733209212621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,4,1,balanced,0.02842666705449422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,4,1,power_law_1.01,0.02720640003681183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,4,1,power_law_1.01,0.02865920066833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,4,1,power_law_1.2,0.0278656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2048,768,8,128,4,1,power_law_1.2,0.02831999957561493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,1,balanced,0.0906773308912913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,1,balanced,0.09152000149091084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,1,power_law_1.01,0.08896639943122864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,1,power_law_1.01,0.08960000276565552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,1,power_law_1.2,0.08852480053901672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,1,power_law_1.2,0.08933119773864746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,128,balanced,0.03152533372243246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,128,balanced,0.03187733391920725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,128,power_law_1.01,0.030636799335479737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,128,power_law_1.01,0.030694401264190672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,128,power_law_1.2,0.030508801341056824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,128,power_law_1.2,0.031193599104881287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,16,balanced,0.033701332906881966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,16,balanced,0.035717333356539406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,16,power_law_1.01,0.04505600035190582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,16,power_law_1.01,0.047884801030159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,16,power_law_1.2,0.04950399994850159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,16,power_law_1.2,0.05021439790725708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,2,balanced,0.06566933294137318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,2,balanced,0.06574933230876923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,2,power_law_1.01,0.06670079827308655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,2,power_law_1.01,0.06889600157737732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,2,power_law_1.2,0.07292159795761108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,2,power_law_1.2,0.08064640164375306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,32,balanced,0.031370667119820915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,32,balanced,0.03150933235883713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,32,power_law_1.01,0.0353408008813858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,32,power_law_1.01,0.0356799989938736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,32,power_law_1.2,0.035334399342536925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,32,power_law_1.2,0.035411199927330016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,4,balanced,0.04308266441027323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,4,balanced,0.04783466458320618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,4,power_law_1.01,0.05722879767417908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,4,power_law_1.01,0.060601598024368285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,4,power_law_1.2,0.060192000865936277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,4,power_law_1.2,0.06711680293083191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,64,balanced,0.03150933235883713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,64,balanced,0.03190399954716364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,64,power_law_1.01,0.032518398761749265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,64,power_law_1.01,0.03284479975700379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,64,power_law_1.2,0.03292160034179688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,64,power_law_1.2,0.03331199884414673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,8,balanced,0.037434667348861694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,8,balanced,0.03753600021203359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,8,power_law_1.01,0.055206400156021115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,8,power_law_1.01,0.05538560152053833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,8,power_law_1.2,0.05470079779624939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,1,8,power_law_1.2,0.05841919779777527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,16,1,balanced,0.05793066819508871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,16,1,balanced,0.058143998185793556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,16,1,power_law_1.01,0.05672320127487183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,16,1,power_law_1.01,0.05743359923362732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,16,1,power_law_1.2,0.05626879930496216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,16,1,power_law_1.2,0.057107198238372806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,2,1,balanced,0.05603733162085215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,2,1,balanced,0.056688000758488975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,2,1,power_law_1.01,0.05432320237159729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,2,1,power_law_1.01,0.055430400371551516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,2,1,power_law_1.2,0.05428479909896851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,2,1,power_law_1.2,0.055232000350952146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,32,1,balanced,0.05603733162085215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,32,1,balanced,0.057002668579419456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,32,1,power_law_1.01,0.055078399181365964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,32,1,power_law_1.01,0.055404800176620486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,32,1,power_law_1.2,0.0549888014793396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,32,1,power_law_1.2,0.055276799201965335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,4,1,balanced,0.03551999976237615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,4,1,balanced,0.037733333806196846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,4,1,power_law_1.01,0.03861759901046753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,4,1,power_law_1.01,0.0392192006111145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,4,1,power_law_1.2,0.03837440013885498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,4,1,power_law_1.2,0.03857280015945434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,8,1,balanced,0.0643093337615331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,8,1,balanced,0.06434133152167003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,8,1,power_law_1.01,0.06684160232543945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,8,1,power_law_1.01,0.06700159907341004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,8,1,power_law_1.2,0.06629760265350342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,2688,1856,6,128,8,1,power_law_1.2,0.06639360189437866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,1,balanced,0.10307199756304423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,1,balanced,0.11920533577601115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,1,power_law_1.01,0.10096640586853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,1,power_law_1.01,0.10243200063705445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,1,power_law_1.2,0.10195200443267823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,1,power_law_1.2,0.10443520545959473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,128,balanced,0.031343999008337654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,128,balanced,0.03169599920511246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,128,power_law_1.01,0.030099201202392577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,128,power_law_1.01,0.030432000756263733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,128,power_law_1.2,0.031014400720596313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,128,power_law_1.2,0.03139840066432953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,16,balanced,0.030853333572546642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,16,balanced,0.033402666449546814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,16,power_law_1.01,0.06861439943313599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,16,power_law_1.01,0.06963840126991272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,16,power_law_1.2,0.058323198556900026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,16,power_law_1.2,0.06423680186271667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,2,balanced,0.07388266424338023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,2,balanced,0.07612800101439159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,2,power_law_1.01,0.09525120258331299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,2,power_law_1.01,0.1028223991394043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,2,power_law_1.2,0.08020480275154114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,2,power_law_1.2,0.09755520224571228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,256,balanced,0.031317333380381264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,256,balanced,0.03158933420976003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,256,power_law_1.01,0.030239999294281006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,256,power_law_1.01,0.030899199843406677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,256,power_law_1.2,0.02959359884262085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,256,power_law_1.2,0.030451199412345885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,32,balanced,0.03145600110292435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,32,balanced,0.03366400053103765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,32,power_law_1.01,0.05115519762039185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,32,power_law_1.01,0.0516543984413147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,32,power_law_1.2,0.050374400615692136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,32,power_law_1.2,0.051532799005508424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,4,balanced,0.04821333289146423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,4,balanced,0.05219733218352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,4,power_law_1.01,0.08140159845352173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,4,power_law_1.01,0.08158720135688782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,4,power_law_1.2,0.06991999745368957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,4,power_law_1.2,0.07434239983558655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,64,balanced,0.03162133445342382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,64,balanced,0.03327466547489166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,64,power_law_1.01,0.034355199337005614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,64,power_law_1.01,0.0350847989320755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,64,power_law_1.2,0.034790399670600894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,64,power_law_1.2,0.03521920144557953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,8,balanced,0.03501333296298981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,8,balanced,0.0367999995748202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,8,power_law_1.01,0.07553279995918274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,8,power_law_1.01,0.07568640112876893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,8,power_law_1.2,0.06087039709091187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,1,8,power_law_1.2,0.06803839802742004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,16,1,balanced,0.02922133356332779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,16,1,balanced,0.029477333029111225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,16,1,power_law_1.01,0.02908160090446472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,16,1,power_law_1.01,0.02956799864768982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,16,1,power_law_1.2,0.029183998703956604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,16,1,power_law_1.2,0.029580798745155335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,2,1,balanced,0.06608533362547557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,2,1,balanced,0.0662773350874583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,2,1,power_law_1.01,0.062412798404693604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,2,1,power_law_1.01,0.072953599691391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,2,1,power_law_1.2,0.06346880197525025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,2,1,power_law_1.2,0.06372479796409607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,32,1,balanced,0.027642667293548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,32,1,balanced,0.028394666810830433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,32,1,power_law_1.01,0.026438400149345398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,32,1,power_law_1.01,0.026521599292755126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,32,1,power_law_1.2,0.027091199159622194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,32,1,power_law_1.2,0.02736000120639801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,4,1,balanced,0.043023998538653054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,4,1,balanced,0.04354133208592733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,4,1,power_law_1.01,0.04287999868392944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,4,1,power_law_1.01,0.04355199933052063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,4,1,power_law_1.2,0.04366079866886139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,4,1,power_law_1.2,0.043699198961257936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,8,1,balanced,0.033344000577926636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,8,1,balanced,0.033610666791598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,8,1,power_law_1.01,0.034092798829078674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,8,1,power_law_1.01,0.034815999865531924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,8,1,power_law_1.2,0.03450239896774292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,3072,1536,8,256,8,1,power_law_1.2,0.03522560000419617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,1,balanced,0.2527093291282654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,1,balanced,0.2537546753883362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,1,power_law_1.01,0.16120959520339967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,1,power_law_1.01,0.16346880197525024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,1,power_law_1.2,0.18276480436325074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,1,power_law_1.2,0.19188480377197265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,2,balanced,0.17385600010553995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,2,balanced,0.18574933211008707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,2,power_law_1.01,0.11354240179061889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,2,power_law_1.01,0.13328640460968016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,2,power_law_1.2,0.136735999584198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,2,power_law_1.2,0.13957120180130006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,4,balanced,0.11199466387430827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,4,balanced,0.11313066879908244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,4,power_law_1.01,0.09536640048027038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,4,power_law_1.01,0.10076800584793091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,4,power_law_1.2,0.1053887963294983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,4,power_law_1.2,0.10940159559249878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,8,balanced,0.08770666519800822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,8,balanced,0.09453866879145305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,8,power_law_1.01,0.08561919927597046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,8,power_law_1.01,0.08609279990196228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,8,power_law_1.2,0.08589439988136291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,1,8,power_law_1.2,0.08634240031242371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,16,1,balanced,0.0365280012289683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,16,1,balanced,0.03761066744724909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,16,1,power_law_1.01,0.03223679959774017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,16,1,power_law_1.01,0.03232640027999878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,16,1,power_law_1.2,0.03086079955101013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,16,1,power_law_1.2,0.032627201080322264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,2,1,balanced,0.14668266971906027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,2,1,balanced,0.1571999986966451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,2,1,power_law_1.01,0.10232959985733033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,2,1,power_law_1.01,0.1081536054611206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,2,1,power_law_1.2,0.10613119602203369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,2,1,power_law_1.2,0.11845120191574096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,32,1,balanced,0.029450667401154835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,32,1,balanced,0.029477333029111225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,32,1,power_law_1.01,0.026662400364875792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,32,1,power_law_1.01,0.027244800329208375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,32,1,power_law_1.2,0.027116799354553224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,32,1,power_law_1.2,0.027622398734092713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,4,1,balanced,0.08418132861455281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,4,1,balanced,0.0848426620165507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,4,1,power_law_1.01,0.060236799716949466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,4,1,power_law_1.01,0.06236799955368042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,4,1,power_law_1.2,0.05922560095787048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,4,1,power_law_1.2,0.06275839805603027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,8,1,balanced,0.05730666716893514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,8,1,balanced,0.057333335280418396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,8,1,power_law_1.01,0.042828801274299624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,8,1,power_law_1.01,0.04450559914112091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,8,1,power_law_1.2,0.041331198811531064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,14336,2,8,8,1,power_law_1.2,0.0458624005317688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,1,balanced,0.13084266583124796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,1,balanced,0.13117866714795431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,1,power_law_1.01,0.12634240388870238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,1,power_law_1.01,0.12741760015487671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,1,power_law_1.2,0.12175999879837036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,1,power_law_1.2,0.12286080121994018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,128,balanced,0.03344533344109853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,128,balanced,0.03369600077470144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,128,power_law_1.01,0.03192319869995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,128,power_law_1.01,0.03247359991073608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,128,power_law_1.2,0.032025599479675294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,128,power_law_1.2,0.03213439881801605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,16,balanced,0.033887999753157295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,16,balanced,0.03532266616821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,16,power_law_1.01,0.055776000022888184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,16,power_law_1.01,0.056390398740768434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,16,power_law_1.2,0.05457280278205871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,16,power_law_1.2,0.056992000341415404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,2,balanced,0.08413867155710857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,2,balanced,0.08455466230710347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,2,power_law_1.01,0.09599999785423279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,2,power_law_1.01,0.09902719855308532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,2,power_law_1.2,0.08712319731712341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,2,power_law_1.2,0.08794879913330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,32,balanced,0.03326933334271113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,32,balanced,0.03331733246644338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,32,power_law_1.01,0.03903360068798065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,32,power_law_1.01,0.039136001467704774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,32,power_law_1.2,0.03918719887733459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,32,power_law_1.2,0.03945600092411041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,4,balanced,0.05959466596444448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,4,balanced,0.0611413319905599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,4,power_law_1.01,0.07581440210342408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,4,power_law_1.01,0.07850880026817322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,4,power_law_1.2,0.06961920261383056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,4,power_law_1.2,0.07616639733314515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,64,balanced,0.03339199970165888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,64,balanced,0.033573334415753685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,64,power_law_1.01,0.03338240087032318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,64,power_law_1.01,0.033632001280784606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,64,power_law_1.2,0.03226880133152008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,64,power_law_1.2,0.03404799997806549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,8,balanced,0.03980266551176707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,8,balanced,0.04205333193143209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,8,power_law_1.01,0.06330239772796631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,8,power_law_1.01,0.06522240042686463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,8,power_law_1.2,0.06219519972801209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,1,8,power_law_1.2,0.06551039814949036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,16,1,balanced,0.03148266673088074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,16,1,balanced,0.03260799994071325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,16,1,power_law_1.01,0.034246399998664856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,16,1,power_law_1.01,0.03501439988613129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,16,1,power_law_1.2,0.034169599413871765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,16,1,power_law_1.2,0.03434880077838898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,2,1,balanced,0.07668800155321757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,2,1,balanced,0.0792906681696574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,2,1,power_law_1.01,0.07527679800987244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,2,1,power_law_1.01,0.0753600001335144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,2,1,power_law_1.2,0.07156479954719544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,2,1,power_law_1.2,0.07167360186576843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,32,1,balanced,0.031157332162062328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,32,1,balanced,0.031258667508761086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,32,1,power_law_1.01,0.02980479896068573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,32,1,power_law_1.01,0.02996479868888855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,32,1,power_law_1.2,0.02990719974040985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,32,1,power_law_1.2,0.03022719919681549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,4,1,balanced,0.05235733091831207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,4,1,balanced,0.054144000013669334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,4,1,power_law_1.01,0.05144320130348205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,4,1,power_law_1.01,0.05146239995956421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,4,1,power_law_1.2,0.049721598625183105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,4,1,power_law_1.2,0.05055999755859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,8,1,balanced,0.03880000114440918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,8,1,balanced,0.03956799954175949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,8,1,power_law_1.01,0.039647999405860904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,8,1,power_law_1.01,0.039743998646736146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,8,1,power_law_1.2,0.03933440148830414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,1536,8,128,8,1,power_law_1.2,0.039743998646736146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,1,balanced,0.4787626663843791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,1,balanced,0.47888533274332684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,1,power_law_1.01,0.4766719818115234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,1,power_law_1.01,0.4770559787750244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,1,power_law_1.2,0.47287678718566895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,1,power_law_1.2,0.47687039375305174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,128,balanced,0.03748800108830134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,128,balanced,0.03949866692225138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,128,power_law_1.01,0.05735039710998535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,128,power_law_1.01,0.05847039818763733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,128,power_law_1.2,0.05786240100860596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,128,power_law_1.2,0.05799040198326111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,16,balanced,0.07945066690444946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,16,balanced,0.07964266836643219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,16,power_law_1.01,0.19317760467529296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,16,power_law_1.01,0.2040191888809204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,16,power_law_1.2,0.19242240190505983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,16,power_law_1.2,0.2033344030380249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,2,balanced,0.26895999908447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,2,balanced,0.26922667026519775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,2,power_law_1.01,0.316595196723938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,2,power_law_1.01,0.3447103977203369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,2,power_law_1.2,0.31943039894104003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,2,power_law_1.2,0.3503551959991455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,256,balanced,0.0378506655494372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,256,balanced,0.03799466788768768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,256,power_law_1.01,0.04343680143356323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,256,power_law_1.01,0.04348799884319306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,256,power_law_1.2,0.04280959963798523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,256,power_law_1.2,0.043635201454162595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,32,balanced,0.06309333443641663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,32,balanced,0.0643039991458257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,32,power_law_1.01,0.1331455945968628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,32,power_law_1.01,0.1332479953765869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,32,power_law_1.2,0.132915198802948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,32,power_law_1.2,0.13293440341949464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,4,balanced,0.16563733418782553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,4,balanced,0.1678826610247294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,4,power_law_1.01,0.2736768007278442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,4,power_law_1.01,0.2752255916595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,4,power_law_1.2,0.27317759990692136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,4,power_law_1.2,0.28012800216674805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,64,balanced,0.05384000142415365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,64,balanced,0.05562133093674978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,64,power_law_1.01,0.07697920203208923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,64,power_law_1.01,0.0780672013759613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,64,power_law_1.2,0.07706239819526672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,64,power_law_1.2,0.07720959782600403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,8,balanced,0.1188266674677531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,8,balanced,0.12081600228945415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,8,power_law_1.01,0.22037119865417482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,8,power_law_1.01,0.22704639434814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,8,power_law_1.2,0.21608319282531738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,1,8,power_law_1.2,0.23518719673156738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,16,1,balanced,0.24763200680414835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,16,1,balanced,0.24893865982691446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,16,1,power_law_1.01,0.24732799530029298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,16,1,power_law_1.01,0.2477952003479004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,16,1,power_law_1.2,0.24769918918609618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,16,1,power_law_1.2,0.24777600765228272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,2,1,balanced,0.2571573257446289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,2,1,balanced,0.25759466489156085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,2,1,power_law_1.01,0.2556864023208618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,2,1,power_law_1.01,0.25715839862823486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,2,1,power_law_1.2,0.25552000999450686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,2,1,power_law_1.2,0.2564608097076416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,32,1,balanced,0.20748267571131387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,32,1,balanced,0.20760534207026163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,32,1,power_law_1.01,0.2103872060775757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,32,1,power_law_1.01,0.21057920455932616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,32,1,power_law_1.2,0.21009280681610107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,32,1,power_law_1.2,0.21068160533905028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,4,1,balanced,0.1513813336690267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,4,1,balanced,0.15433067083358765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,4,1,power_law_1.01,0.1509376049041748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,4,1,power_law_1.01,0.15141760110855101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,4,1,power_law_1.2,0.14996479749679564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,4,1,power_law_1.2,0.15098240375518798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,8,1,balanced,0.10288000106811523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,8,1,balanced,0.10843200484911601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,8,1,power_law_1.01,0.09853439927101135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,8,1,power_law_1.01,0.0986240029335022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,8,1,power_law_1.2,0.09894400238990783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,4096,2688,22,512,8,1,power_law_1.2,0.09943040013313294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,1,balanced,0.43351467450459796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,1,balanced,0.43410666783650714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,1,power_law_1.01,0.26794240474700926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,1,power_law_1.01,0.2704960107803345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,1,power_law_1.2,0.27388160228729247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,1,power_law_1.2,0.32118399143218995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,2,balanced,0.24722667535146078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,2,balanced,0.2696533401807149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,2,power_law_1.01,0.17904000282287597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,2,power_law_1.01,0.208076810836792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,2,power_law_1.2,0.16219520568847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,2,power_law_1.2,0.19604480266571045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,4,balanced,0.1655946671962738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,4,balanced,0.1701493263244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,4,power_law_1.01,0.1327232003211975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,4,power_law_1.01,0.13564800024032592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,4,power_law_1.2,0.1343808054924011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,4,power_law_1.2,0.14229120016098024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,8,balanced,0.11094933748245239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,8,balanced,0.11528000235557556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,8,power_law_1.01,0.11077760457992554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,8,power_law_1.01,0.11260800361633301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,8,power_law_1.2,0.11043839454650879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,1,8,power_law_1.2,0.11175040006637574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,16,1,balanced,0.056234667698542275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,16,1,balanced,0.058378666639328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,16,1,power_law_1.01,0.04152320027351379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,16,1,power_law_1.01,0.043296000361442565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,16,1,power_law_1.2,0.04291200041770935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,16,1,power_law_1.2,0.04360319972038269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,2,1,balanced,0.2301973303159078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,2,1,balanced,0.24813334147135416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,2,1,power_law_1.01,0.14582400321960448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,2,1,power_law_1.01,0.15688320398330688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,2,1,power_law_1.2,0.154367995262146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,2,1,power_law_1.2,0.154476797580719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,32,1,balanced,0.03562133262554804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,32,1,balanced,0.03707200040419897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,32,1,power_law_1.01,0.034835198521614076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,32,1,power_law_1.01,0.035308799147605895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,32,1,power_law_1.2,0.03389439880847931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,32,1,power_law_1.2,0.03410559892654419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,4,1,balanced,0.1322879989941915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,4,1,balanced,0.14310399691263834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,4,1,power_law_1.01,0.08461440205574036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,4,1,power_law_1.01,0.08817279934883118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,4,1,power_law_1.2,0.0880895972251892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,4,1,power_law_1.2,0.10686719417572021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,8,1,balanced,0.08483200271924336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,8,1,balanced,0.08602666854858398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,8,1,power_law_1.01,0.056531202793121335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,8,1,power_law_1.01,0.06392319798469544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,8,1,power_law_1.2,0.0585919976234436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,16384,2,8,8,1,power_law_1.2,0.06695039868354798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,1,balanced,0.22540799776713052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,1,balanced,0.24066666762034097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,1,power_law_1.01,0.22512640953063964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,1,power_law_1.01,0.22847359180450438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,1,power_law_1.2,0.22775681018829347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,1,power_law_1.2,0.22889599800109864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,128,balanced,0.03743999948104223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,128,balanced,0.03766933331886927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,128,power_law_1.01,0.04314880073070526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,128,power_law_1.01,0.04348160028457641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,128,power_law_1.2,0.04320639967918396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,128,power_law_1.2,0.043910399079322815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,16,balanced,0.045552000403404236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,16,balanced,0.047781333327293396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,16,power_law_1.01,0.1347391963005066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,16,power_law_1.01,0.1379520058631897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,16,power_law_1.2,0.13207039833068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,16,power_law_1.2,0.1332352042198181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,2,balanced,0.1395039955774943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,2,balanced,0.14131200313568115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,2,power_law_1.01,0.18659839630126954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,2,power_law_1.01,0.20172159671783446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,2,power_law_1.2,0.18232959508895874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,2,power_law_1.2,0.18624000549316405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,256,balanced,0.03835200021664301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,256,balanced,0.039749334255854286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,256,power_law_1.01,0.03656319975852966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,256,power_law_1.01,0.036575999855995175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,256,power_law_1.2,0.036934399604797365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,32,balanced,0.03772266705830892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,32,balanced,0.03982399900754293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,32,power_law_1.01,0.08180480003356934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,32,power_law_1.01,0.0831167995929718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,32,power_law_1.2,0.08273280262947083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,32,power_law_1.2,0.08481280207633972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,4,balanced,0.08283199866612752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,4,balanced,0.09504533807436626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,4,power_law_1.01,0.169376003742218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,4,power_law_1.01,0.17526400089263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,4,power_law_1.2,0.14396159648895263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,4,power_law_1.2,0.16394879817962646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,64,balanced,0.039477333426475525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,64,balanced,0.03959999978542328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,64,power_law_1.01,0.06252800226211548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,64,power_law_1.01,0.06364799737930298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,64,power_law_1.2,0.061817598342895505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,64,power_law_1.2,0.06306560039520263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,8,balanced,0.06378666559855144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,8,balanced,0.06448533137639363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,8,power_law_1.01,0.15242880582809448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,8,power_law_1.01,0.16241919994354248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,8,power_law_1.2,0.1305343985557556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,1,8,power_law_1.2,0.1530176043510437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,16,1,balanced,0.04240000247955322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,16,1,balanced,0.043178667624791466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,16,1,power_law_1.01,0.04433920085430145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,16,1,power_law_1.01,0.04519039988517761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,16,1,power_law_1.2,0.044838398694992065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,16,1,power_law_1.2,0.04496000111103058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,2,1,balanced,0.12787200013796488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,2,1,balanced,0.1300320029258728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,2,1,power_law_1.01,0.1276800036430359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,2,1,power_law_1.01,0.12829439640045165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,2,1,power_law_1.2,0.12699520587921143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,2,1,power_law_1.2,0.12702080011367797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,32,1,balanced,0.03813866774241129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,32,1,balanced,0.03945599993069967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,32,1,power_law_1.01,0.04177280068397522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,32,1,power_law_1.01,0.042131200432777405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,32,1,power_law_1.2,0.04245119988918304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,32,1,power_law_1.2,0.04289279878139496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,4,1,balanced,0.07656000057856242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,4,1,balanced,0.07820266485214233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,4,1,power_law_1.01,0.07623040080070495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,4,1,power_law_1.01,0.07719039916992188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,4,1,power_law_1.2,0.0753920018672943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,4,1,power_law_1.2,0.07581440210342408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,8,1,balanced,0.05596266686916351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,8,1,balanced,0.0565280020236969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,8,1,power_law_1.01,0.05415679812431336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,8,1,power_law_1.01,0.05488640069961548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,8,1,power_law_1.2,0.054016000032424925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2048,8,256,8,1,power_law_1.2,0.0543615996837616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,1,balanced,0.2690933346748352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,1,balanced,0.271397332350413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,1,power_law_1.01,0.2691839933395386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,1,power_law_1.01,0.2696448087692261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,1,power_law_1.2,0.26765439510345457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,1,power_law_1.2,0.26956160068511964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,16,balanced,0.04969066878159841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,16,balanced,0.04993066688378652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,16,power_law_1.01,0.10964479446411132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,16,power_law_1.01,0.1121664047241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,16,power_law_1.2,0.11255680322647095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,16,power_law_1.2,0.11749759912490845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,2,balanced,0.16707199811935425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,2,balanced,0.16951467593510947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,2,power_law_1.01,0.18524160385131835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,2,power_law_1.01,0.19115519523620605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,2,power_law_1.2,0.19090559482574462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,2,power_law_1.2,0.19925119876861572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,32,balanced,0.039488000174363456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,32,balanced,0.03961066653331121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,32,power_law_1.01,0.07195519804954528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,32,power_law_1.01,0.07246080040931702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,32,power_law_1.2,0.07153919935226441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,32,power_law_1.2,0.0729088008403778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,4,balanced,0.09927999973297119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,4,balanced,0.11217066645622253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,4,power_law_1.01,0.1525887966156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,4,power_law_1.01,0.15765759944915772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,4,power_law_1.2,0.16390399932861327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,4,power_law_1.2,0.16590720415115356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,8,balanced,0.06833600004514058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,8,balanced,0.06846933563550313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,8,power_law_1.01,0.11911040544509888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,8,power_law_1.01,0.14529279470443726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,8,power_law_1.2,0.1489856004714966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,1,8,power_law_1.2,0.1496832013130188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,16,1,balanced,0.04757866760094961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,16,1,balanced,0.049925332268079124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,16,1,power_law_1.01,0.05074560046195984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,16,1,power_law_1.01,0.05095679759979248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,16,1,power_law_1.2,0.049491199851036075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,16,1,power_law_1.2,0.04991360008716583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,2,1,balanced,0.15458133816719055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,2,1,balanced,0.15853866934776306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,2,1,power_law_1.01,0.15560959577560424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,2,1,power_law_1.01,0.1560639977455139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,2,1,power_law_1.2,0.1536064028739929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,2,1,power_law_1.2,0.15712640285491944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,32,1,balanced,0.039306665460268654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,32,1,balanced,0.041802664597829185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,32,1,power_law_1.01,0.043635201454162595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,32,1,power_law_1.01,0.04371199905872345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,32,1,power_law_1.2,0.04382080137729645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,32,1,power_law_1.2,0.043942400813102724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,4,1,balanced,0.09034666419029236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,4,1,balanced,0.09160000085830688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,4,1,power_law_1.01,0.08922240138053894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,4,1,power_law_1.01,0.0911616027355194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,4,1,power_law_1.2,0.0856383979320526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,4,1,power_law_1.2,0.08599680066108703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,8,1,balanced,0.06451733410358429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,8,1,balanced,0.06740266581376393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,8,1,power_law_1.01,0.06312959790229797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,8,1,power_law_1.01,0.06323199868202209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,8,1,power_law_1.2,0.06287999749183655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,6144,2560,8,160,8,1,power_law_1.2,0.06291199922561645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,1,balanced,0.25408534208933514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,1,balanced,0.25621867179870605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,1,power_law_1.01,0.25530879497528075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,1,power_law_1.01,0.25603199005126953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,1,power_law_1.2,0.2538367986679077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,1,power_law_1.2,0.25569279193878175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,128,balanced,0.04162133236726125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,128,balanced,0.04191466669241587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,128,power_law_1.01,0.04785920083522797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,128,power_law_1.01,0.048716801404953006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,128,power_law_1.2,0.04647679924964905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,128,power_law_1.2,0.04886400103569031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,16,balanced,0.04778666794300079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,16,balanced,0.0499839981396993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,16,power_law_1.01,0.14958720207214354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,16,power_law_1.01,0.14968960285186766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,16,power_law_1.2,0.13339519500732422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,16,power_law_1.2,0.14264960289001466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,2,balanced,0.1507306694984436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,2,balanced,0.1509119967619578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,2,power_law_1.01,0.21867520809173585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,2,power_law_1.01,0.226476788520813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,2,power_law_1.2,0.19742079973220825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,2,power_law_1.2,0.20891520977020264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,256,balanced,0.04165333261092504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,256,balanced,0.04200533529122671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,256,power_law_1.01,0.04042240083217621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,256,power_law_1.01,0.04095999896526337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,256,power_law_1.2,0.0398144006729126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,256,power_law_1.2,0.04022400081157684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,32,balanced,0.04173333446184794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,32,balanced,0.04178133110205332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,32,power_law_1.01,0.09194239974021912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,32,power_law_1.01,0.0926912009716034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,32,power_law_1.2,0.09127680063247681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,32,power_law_1.2,0.09132800102233887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,4,balanced,0.10013866424560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,4,balanced,0.12528000275293985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,4,power_law_1.01,0.1913151979446411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,4,power_law_1.01,0.20020480155944825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,4,power_law_1.2,0.1621567964553833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,4,power_law_1.2,0.1751871943473816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,64,balanced,0.04145599901676178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,64,balanced,0.04148799926042557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,64,power_law_1.01,0.06759039759635925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,64,power_law_1.01,0.06799359917640686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,64,power_law_1.2,0.06694399714469909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,64,power_law_1.2,0.06710399985313416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,8,balanced,0.07454933226108551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,8,balanced,0.08444799979527791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,8,power_law_1.01,0.1884735941886902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,8,power_law_1.01,0.19687680006027222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,8,power_law_1.2,0.1495743989944458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,1,8,power_law_1.2,0.1650431990623474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,16,1,balanced,0.04765866696834564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,16,1,balanced,0.049626668294270836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,16,1,power_law_1.01,0.04872959852218628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,16,1,power_law_1.01,0.049107199907302855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,16,1,power_law_1.2,0.049619200825691226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,16,1,power_law_1.2,0.049932798743247984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,2,1,balanced,0.1434506674607595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,2,1,balanced,0.1456000010172526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,2,1,power_law_1.01,0.14194560050964355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,2,1,power_law_1.01,0.1427135944366455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,2,1,power_law_1.2,0.14154239892959594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,2,1,power_law_1.2,0.14185600280761718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,32,1,balanced,0.04135466615358988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,32,1,balanced,0.04141866664091746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,32,1,power_law_1.01,0.0453247994184494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,32,1,power_law_1.01,0.0471807986497879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,32,1,power_law_1.2,0.04597119987010956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,32,1,power_law_1.2,0.047417598962783816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,4,1,balanced,0.08522666494051616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,4,1,balanced,0.08674133817354839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,4,1,power_law_1.01,0.08528000116348267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,4,1,power_law_1.01,0.09011840224266052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,4,1,power_law_1.2,0.08490239977836608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,4,1,power_law_1.2,0.08720639944076539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,8,1,balanced,0.06378666559855144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,8,1,balanced,0.06625600159168243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,8,1,power_law_1.01,0.060652798414230345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,8,1,power_law_1.01,0.06161919832229614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,8,1,power_law_1.2,0.060236799716949466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,256,8,1,power_law_1.2,0.06114559769630432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,1,balanced,0.25845867395401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,1,balanced,0.2592693368593852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,1,power_law_1.01,0.2538815975189209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,1,power_law_1.01,0.2575167894363403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,1,power_law_1.2,0.2532480001449585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,1,power_law_1.2,0.25522561073303224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,128,balanced,0.04104000081618627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,128,balanced,0.041850666205088295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,128,power_law_1.01,0.0593280017375946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,128,power_law_1.01,0.05953279733657837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,128,power_law_1.2,0.05941759943962097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,128,power_law_1.2,0.059622400999069215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,16,balanced,0.04799466828505198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,16,balanced,0.0480373352766037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,16,power_law_1.01,0.20508160591125488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,16,power_law_1.01,0.20568320751190186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,16,power_law_1.2,0.18878719806671143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,16,power_law_1.2,0.2003391981124878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,2,balanced,0.1504586637020111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,2,balanced,0.15125333269437155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,2,power_law_1.01,0.259334397315979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,2,power_law_1.01,0.26201601028442384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,2,power_law_1.2,0.22077438831329346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,2,power_law_1.2,0.24009599685668945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,32,balanced,0.04119466741879781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,32,balanced,0.04146133363246918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,32,power_law_1.01,0.13418879508972167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,32,power_law_1.01,0.13598079681396485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,32,power_law_1.2,0.13557759523391724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,32,power_law_1.2,0.13687679767608643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,4,balanced,0.09397332866986592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,4,balanced,0.09469866752624512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,4,power_law_1.01,0.26172800064086915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,4,power_law_1.01,0.26211841106414796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,4,power_law_1.2,0.20179200172424316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,4,power_law_1.2,0.20755839347839355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,64,balanced,0.04165333261092504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,64,balanced,0.04185600082079569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,64,power_law_1.01,0.07921919822692872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,64,power_law_1.01,0.07933440208435058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,64,power_law_1.2,0.07901440262794494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,64,power_law_1.2,0.07909759879112244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,8,balanced,0.06691733499368031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,8,balanced,0.06810666620731354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,8,power_law_1.01,0.26155519485473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,8,power_law_1.01,0.2636735916137695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,8,power_law_1.2,0.20195839405059815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,1,8,power_law_1.2,0.20584959983825685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,16,1,balanced,0.047839999198913574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,16,1,balanced,0.04979733129342397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,16,1,power_law_1.01,0.043296000361442565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,16,1,power_law_1.01,0.04467839896678925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,16,1,power_law_1.2,0.04836480021476745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,16,1,power_law_1.2,0.04891520142555237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,2,1,balanced,0.143477330605189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,2,1,balanced,0.1458293298880259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,2,1,power_law_1.01,0.1428096055984497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,2,1,power_law_1.01,0.1482432007789612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,2,1,power_law_1.2,0.14277119636535646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,2,1,power_law_1.2,0.14385279417037963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,32,1,balanced,0.040021332601706185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,32,1,balanced,0.046096002062161766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,32,1,power_law_1.01,0.0390720009803772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,32,1,power_law_1.01,0.039705601334571836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,32,1,power_law_1.2,0.0449535995721817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,32,1,power_law_1.2,0.045459198951721194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,4,1,balanced,0.08541867136955261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,4,1,balanced,0.0869706670443217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,4,1,power_law_1.01,0.084307199716568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,4,1,power_law_1.01,0.08526719808578491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,4,1,power_law_1.2,0.08476160168647766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,4,1,power_law_1.2,0.08486400246620178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,8,1,balanced,0.06213866670926412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,8,1,balanced,0.0634933312733968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,8,1,power_law_1.01,0.06108800172805786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,8,1,power_law_1.01,0.06172159910202026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,8,1,power_law_1.2,0.06101760268211365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4,7168,2048,8,384,8,1,power_law_1.2,0.061292797327041626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,1,balanced,0.43773333231608075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,1,balanced,0.4397546847661336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,1,power_law_1.01,0.49353599548339844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,1,power_law_1.01,0.49482879638671873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,1,power_law_1.2,0.5036928176879882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,1,power_law_1.2,0.5074751853942872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,128,balanced,0.25918400287628174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,128,balanced,0.25945067405700684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,128,power_law_1.01,0.26860799789428713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,128,power_law_1.01,0.2719167947769165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,128,power_law_1.2,0.2751296043395996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,128,power_law_1.2,0.278112006187439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,16,balanced,0.269269327322642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,16,balanced,0.2701866626739502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,16,power_law_1.01,0.2880768060684204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,16,power_law_1.01,0.29002881050109863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,16,power_law_1.2,0.28896639347076414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,16,power_law_1.2,0.29687678813934326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,2,balanced,0.36980267365773517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,2,balanced,0.37221864859263104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,2,power_law_1.01,0.41242241859436035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,2,power_law_1.01,0.41481599807739256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,2,power_law_1.2,0.41728639602661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,2,power_law_1.2,0.4196800231933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,32,balanced,0.2635786732037862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,32,balanced,0.26445333162943524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,32,power_law_1.01,0.2752959966659546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,32,power_law_1.01,0.27980799674987794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,32,power_law_1.2,0.28624639511108396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,32,power_law_1.2,0.2863039970397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,4,balanced,0.31169066826502484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,4,balanced,0.31436266501744586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,4,power_law_1.01,0.3419519901275635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,4,power_law_1.01,0.3434751987457275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,4,power_law_1.2,0.3465536117553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,4,power_law_1.2,0.3509376049041748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,64,balanced,0.26125333706537884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,64,balanced,0.26262933015823364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,64,power_law_1.01,0.27180800437927244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,64,power_law_1.01,0.27280640602111816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,64,power_law_1.2,0.281439995765686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,64,power_law_1.2,0.28405759334564207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,8,balanced,0.28379732370376587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,8,balanced,0.2852693398793538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,8,power_law_1.01,0.3047231912612915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,8,power_law_1.01,0.30524799823760984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,8,power_law_1.2,0.31371519565582273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,1,8,power_law_1.2,0.32032639980316163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,2,1,balanced,0.3155626654624939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,2,1,balanced,0.3162720004717509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,2,1,power_law_1.01,0.34917759895324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,2,1,power_law_1.01,0.34970879554748535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,2,1,power_law_1.2,0.3542975902557373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,2,1,power_law_1.2,0.35767040252685545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,4,1,balanced,0.26525866985321045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,4,1,balanced,0.26531734069188434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,4,1,power_law_1.01,0.29171841144561766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,4,1,power_law_1.01,0.29341440200805663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,4,1,power_law_1.2,0.2939199924468994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2048,768,8,128,4,1,power_law_1.2,0.2966399908065796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,1,balanced,0.8704319794972738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,1,balanced,0.8827199935913086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,1,power_law_1.01,0.931833553314209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,1,power_law_1.01,0.9348416328430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,1,power_law_1.2,0.946713638305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,1,power_law_1.2,0.9505023956298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,128,balanced,0.33453865845998126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,128,balanced,0.33530668417612713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,128,power_law_1.01,0.35359361171722414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,128,power_law_1.01,0.3543423891067505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,128,power_law_1.2,0.37445759773254395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,128,power_law_1.2,0.38668160438537597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,16,balanced,0.36852800846099854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,16,balanced,0.3712426821390788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,16,power_law_1.01,0.39619200229644774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,16,power_law_1.01,0.4046016216278076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,16,power_law_1.2,0.4124288082122803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,16,power_law_1.2,0.4238272190093994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,2,balanced,0.6264906724294027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,2,balanced,0.6277173360188802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,2,power_law_1.01,0.6722367763519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,2,power_law_1.01,0.6803840160369873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,2,power_law_1.2,0.6798143863677979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,2,power_law_1.2,0.6803967952728271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,32,balanced,0.3497013250986735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,32,balanced,0.35070931911468506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,32,power_law_1.01,0.37246720790863036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,32,power_law_1.01,0.3738687992095947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,32,power_law_1.2,0.39239039421081545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,32,power_law_1.2,0.39674880504608157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,4,balanced,0.4835840066274007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,4,balanced,0.48527467250823975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,4,power_law_1.01,0.5179967880249023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,4,power_law_1.01,0.5314688205718994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,4,power_law_1.2,0.5370495796203614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,4,power_law_1.2,0.5382143974304199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,64,balanced,0.3384586572647095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,64,balanced,0.3385546604792277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,64,power_law_1.01,0.3588992118835449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,64,power_law_1.01,0.36785919666290284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,64,power_law_1.2,0.3826688051223755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,64,power_law_1.2,0.38537600040435793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,8,balanced,0.40811200936635333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,8,balanced,0.41050668557484943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,8,power_law_1.01,0.43973121643066404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,8,power_law_1.01,0.4434368133544922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,8,power_law_1.2,0.44990081787109376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,1,8,power_law_1.2,0.47727360725402834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,16,1,balanced,1.5561280250549316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,16,1,balanced,1.5615733464558919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,16,1,power_law_1.01,1.6296512603759765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,16,1,power_law_1.01,1.6765504837036134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,16,1,power_law_1.2,1.688844871520996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,16,1,power_law_1.2,1.693395233154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,2,1,balanced,0.5566773414611816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,2,1,balanced,0.5593066612879435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,2,1,power_law_1.01,0.5831999778747559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,2,1,power_law_1.01,0.5860799789428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,2,1,power_law_1.2,0.598041582107544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,2,1,power_law_1.2,0.599187183380127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,32,1,balanced,1.3537227312723796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,32,1,balanced,1.3537386258443196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,32,1,power_law_1.01,1.4638784408569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,32,1,power_law_1.01,1.4657471656799317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,32,1,power_law_1.2,1.4867775917053223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,32,1,power_law_1.2,1.4920512199401856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,4,1,balanced,0.3957226673762004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,4,1,balanced,0.3957333167394002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,4,1,power_law_1.01,0.41858558654785155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,4,1,power_law_1.01,0.4210815906524658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,4,1,power_law_1.2,0.42298240661621095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,4,1,power_law_1.2,0.42500481605529783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,8,1,balanced,2.0921972592671714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,8,1,balanced,2.108026663462321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,8,1,power_law_1.01,2.1462080001831056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,8,1,power_law_1.01,2.2588415145874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,8,1,power_law_1.2,2.275200080871582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,2688,1856,6,128,8,1,power_law_1.2,2.3247615814208986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,1,balanced,1.0517280101776123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,1,balanced,1.0547626813252766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,1,power_law_1.01,1.3038911819458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,1,power_law_1.01,1.3131135940551757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,1,power_law_1.2,1.350175952911377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,1,power_law_1.2,1.3557503700256348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,128,balanced,0.40371731917063397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,128,balanced,0.4055146773656209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,128,power_law_1.01,0.4249407768249512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,128,power_law_1.01,0.4289663791656494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,128,power_law_1.2,0.4359488010406494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,128,power_law_1.2,0.44272642135620116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,16,balanced,0.4437386592229207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,16,balanced,0.44492268562316895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,16,power_law_1.01,0.4885568141937256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,16,power_law_1.01,0.492793607711792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,16,power_law_1.2,0.5008448123931885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,16,power_law_1.2,0.5030784130096435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,2,balanced,0.7593653202056885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,2,balanced,0.7602880001068115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,2,power_law_1.01,0.8994048118591309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,2,power_law_1.01,0.9000127792358399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,2,power_law_1.2,0.9243391990661621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,2,power_law_1.2,0.9473088264465332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,256,balanced,0.40322665373484295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,256,balanced,0.4041066567103068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,256,power_law_1.01,0.41633920669555663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,256,power_law_1.01,0.4174079895019531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,256,power_law_1.2,0.4274623870849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,256,power_law_1.2,0.4298880100250244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,32,balanced,0.4193439881006877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,32,balanced,0.41997865835825604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,32,power_law_1.01,0.44976000785827636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,32,power_law_1.01,0.4544640064239502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,32,power_law_1.2,0.4660927772521973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,32,power_law_1.2,0.4663104057312012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,4,balanced,0.587061325709025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,4,balanced,0.5874346494674683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,4,power_law_1.01,0.6643455982208252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,4,power_law_1.01,0.6732672214508056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,4,power_law_1.2,0.681606388092041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,4,power_law_1.2,0.7021632194519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,64,balanced,0.4073439836502075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,64,balanced,0.4082080125808716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,64,power_law_1.01,0.4320000171661377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,64,power_law_1.01,0.43452157974243166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,64,power_law_1.2,0.44919681549072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,64,power_law_1.2,0.4516160011291504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,8,balanced,0.4922826687494914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,8,balanced,0.49531201521555585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,8,power_law_1.01,0.5465919971466064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,8,power_law_1.01,0.5503680229187011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,8,power_law_1.2,0.5652480125427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,1,8,power_law_1.2,0.572979211807251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,16,1,balanced,0.3370986779530843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,16,1,balanced,0.3380959828694661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,16,1,power_law_1.01,0.3953536033630371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,16,1,power_law_1.01,0.39560320377349856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,16,1,power_law_1.2,0.40955519676208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,16,1,power_law_1.2,0.409606409072876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,2,1,balanced,0.6663626829783121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,2,1,balanced,0.6675626436869303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,2,1,power_law_1.01,0.804633617401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,2,1,power_law_1.01,0.8120256423950195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,2,1,power_law_1.2,0.8345727920532227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,2,1,power_law_1.2,0.8375424385070801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,32,1,balanced,0.31401065985361737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,32,1,balanced,0.31496532758076984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,32,1,power_law_1.01,0.3702336072921753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,32,1,power_law_1.01,0.3714047908782959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,32,1,power_law_1.2,0.3772160053253174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,32,1,power_law_1.2,0.37781760692596433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,4,1,balanced,0.46838398774464923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,4,1,balanced,0.46889599164326984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,4,1,power_law_1.01,0.5552896022796631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,4,1,power_law_1.01,0.5582592010498046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,4,1,power_law_1.2,0.5732863903045654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,4,1,power_law_1.2,0.575929594039917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,8,1,balanced,0.38311465581258136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,8,1,balanced,0.383568008740743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,8,1,power_law_1.01,0.45250558853149414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,8,1,power_law_1.01,0.45361919403076173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,8,1,power_law_1.2,0.46202878952026366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,3072,1536,8,256,8,1,power_law_1.2,0.46273279190063477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,1,balanced,1.8245867093404133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,1,balanced,1.862661361694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,1,power_law_1.01,1.9158016204833985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,1,power_law_1.01,1.9557567596435548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,1,power_law_1.2,1.9321664810180663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,1,power_law_1.2,1.9478464126586914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,2,balanced,1.1927680174509685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,2,balanced,1.1932053565979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,2,power_law_1.01,1.4441023826599122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,2,power_law_1.01,1.4613568305969238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,2,power_law_1.2,1.4430272102355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,2,power_law_1.2,1.5008959770202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,4,balanced,0.8454133669535319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,4,balanced,0.8528532981872559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,4,power_law_1.01,1.1011263847351074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,4,power_law_1.01,1.3298687934875488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,4,power_law_1.2,1.1717184066772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,4,power_law_1.2,1.1943296432495116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,8,balanced,0.6830879847208658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,8,balanced,0.6846506595611572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,8,power_law_1.01,1.1857088088989258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,8,power_law_1.01,1.1865471839904784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,8,power_law_1.2,1.1436736106872558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,1,8,power_law_1.2,1.1884032249450684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,16,1,balanced,0.22461867332458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,16,1,balanced,0.22524267435073853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,16,1,power_law_1.01,0.22698240280151366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,16,1,power_law_1.01,0.2274303913116455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,16,1,power_law_1.2,0.22602241039276122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,16,1,power_law_1.2,0.22910718917846679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,2,1,balanced,0.9504853089650472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,2,1,balanced,0.9541599750518799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,2,1,power_law_1.01,1.0016063690185546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,2,1,power_law_1.01,1.0279423713684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,2,1,power_law_1.2,0.9958463668823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,2,1,power_law_1.2,1.0027968406677246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,32,1,balanced,0.17084266742070517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,32,1,balanced,0.17151999473571777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,32,1,power_law_1.01,0.1762112021446228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,32,1,power_law_1.01,0.17779200077056884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,32,1,power_law_1.2,0.17804160118103027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,32,1,power_law_1.2,0.18009599447250366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,4,1,balanced,0.5180746714274088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,4,1,balanced,0.5320373376210531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,4,1,power_law_1.01,0.5430463790893555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,4,1,power_law_1.01,0.5479551792144776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,4,1,power_law_1.2,0.538265609741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,4,1,power_law_1.2,0.544051218032837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,8,1,balanced,0.31996800502141315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,8,1,balanced,0.32344533999760944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,8,1,power_law_1.01,0.3259455919265747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,8,1,power_law_1.01,0.3321216106414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,8,1,power_law_1.2,0.3321280002593994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,14336,2,8,8,1,power_law_1.2,0.33562240600585935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,1,balanced,1.1021493275960286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,1,balanced,1.1212480068206787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,1,power_law_1.01,1.289958381652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,1,power_law_1.01,1.2934207916259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,1,power_law_1.2,1.3171775817871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,1,power_law_1.2,1.3175935745239258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,128,balanced,0.4280053377151489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,128,balanced,0.42815999190012616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,128,power_law_1.01,0.45863680839538573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,128,power_law_1.01,0.4649087905883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,128,power_law_1.2,0.4861311912536621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,128,power_law_1.2,0.4897280216217041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,16,balanced,0.46697600682576496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,16,balanced,0.46825067202250165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,16,power_law_1.01,0.523308801651001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,16,power_law_1.01,0.5273280143737793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,16,power_law_1.2,0.5490303993225097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,16,power_law_1.2,0.5738304138183594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,2,balanced,0.800544023513794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,2,balanced,0.8039147059122721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,2,power_law_1.01,0.9477503776550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,2,power_law_1.01,0.9692095756530762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,2,power_law_1.2,0.9492416381835938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,2,power_law_1.2,0.9835776329040528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,32,balanced,0.4435253143310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,32,balanced,0.4463466803232829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,32,power_law_1.01,0.4876992225646973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,32,power_law_1.01,0.4987071990966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,32,power_law_1.2,0.5070400238037109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,32,power_law_1.2,0.5200319766998291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,4,balanced,0.6159893274307251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,4,balanced,0.6172159910202026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,4,power_law_1.01,0.7024127960205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,4,power_law_1.01,0.7276351928710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,4,power_law_1.2,0.7285952091217041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,4,power_law_1.2,0.7562623977661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,64,balanced,0.43086401621500653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,64,balanced,0.43244266510009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,64,power_law_1.01,0.4808063983917236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,64,power_law_1.01,0.4859327793121338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,64,power_law_1.2,0.48900480270385743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,64,power_law_1.2,0.49873919486999513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,8,balanced,0.5161546468734741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,8,balanced,0.5196373462677002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,8,power_law_1.01,0.5812992095947266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,8,power_law_1.01,0.5947199821472168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,8,power_law_1.2,0.6045631885528564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,1,8,power_law_1.2,0.6156544208526611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,16,1,balanced,0.3872426748275757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,16,1,balanced,0.38784531752268475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,16,1,power_law_1.01,0.434335994720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,16,1,power_law_1.01,0.435532808303833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,16,1,power_law_1.2,0.4375936031341553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,16,1,power_law_1.2,0.43863677978515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,2,1,balanced,0.720245361328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,2,1,balanced,0.7208853562672933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,2,1,power_law_1.01,0.8201087951660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,2,1,power_law_1.01,0.8212991714477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,2,1,power_law_1.2,0.8350208282470704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,2,1,power_law_1.2,0.8369791984558106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,32,1,balanced,0.36374934514363605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,32,1,balanced,0.3646186590194702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,32,1,power_law_1.01,0.4089791774749756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,32,1,power_law_1.01,0.40938878059387207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,32,1,power_law_1.2,0.41214718818664553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,32,1,power_law_1.2,0.4124608039855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,4,1,balanced,0.521781325340271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,4,1,balanced,0.5238613287607828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,4,1,power_law_1.01,0.5819456100463867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,4,1,power_law_1.01,0.5829504013061524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,4,1,power_law_1.2,0.5927807807922363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,4,1,power_law_1.2,0.5940800189971924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,8,1,balanced,0.4352373282114665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,8,1,balanced,0.4354453484217326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,8,1,power_law_1.01,0.485427188873291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,8,1,power_law_1.01,0.48563199043273925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,8,1,power_law_1.2,0.48762240409851076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,1536,8,128,8,1,power_law_1.2,0.48975358009338377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,1,balanced,6.427610397338867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,1,balanced,6.431957244873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,1,power_law_1.01,6.948556518554687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,1,power_law_1.01,7.100460815429687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,1,power_law_1.2,7.2648193359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,1,power_law_1.2,7.337094116210937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,128,balanced,1.5310880343119304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,128,balanced,1.53166929880778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,128,power_law_1.01,1.5867072105407716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,128,power_law_1.01,1.5924223899841308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,128,power_law_1.2,1.6113536834716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,128,power_law_1.2,1.6247743606567382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,16,balanced,1.795786698659261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,16,balanced,1.8021012941996257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,16,power_law_1.01,1.8956287384033204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,16,power_law_1.01,1.9145536422729492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,16,power_law_1.2,1.9388927459716796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,16,power_law_1.2,1.9667648315429687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,2,balanced,4.053642590840657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,2,balanced,4.057658513387044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,2,power_law_1.01,4.1617279052734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,2,power_law_1.01,4.2636161804199215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,2,power_law_1.2,4.394534301757813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,2,power_law_1.2,4.471807861328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,256,balanced,1.5095146497090657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,256,balanced,1.5095787048339844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,256,power_law_1.01,1.5606016159057616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,256,power_law_1.01,1.5690879821777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,256,power_law_1.2,1.5791744232177733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,256,power_law_1.2,1.605401611328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,32,balanced,1.644015947977702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,32,balanced,1.6508906682332356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,32,power_law_1.01,1.7308095932006835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,32,power_law_1.01,1.7317184448242187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,32,power_law_1.2,1.7769407272338866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,32,power_law_1.2,1.7926912307739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,4,balanced,2.6738560994466147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,4,balanced,2.685130755106608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,4,power_law_1.01,2.8532032012939452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,4,power_law_1.01,2.8886783599853514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,4,power_law_1.2,2.962566375732422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,4,power_law_1.2,2.9666112899780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,64,balanced,1.567354679107666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,64,balanced,1.5694133440653484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,64,power_law_1.01,1.6371007919311524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,64,power_law_1.01,1.6466623306274415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,64,power_law_1.2,1.6869632720947265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,64,power_law_1.2,1.6923519134521485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,8,balanced,2.0965332984924316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,8,balanced,2.1028213500976562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,8,power_law_1.01,2.2075071334838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,8,power_law_1.01,2.2140607833862305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,8,power_law_1.2,2.2811904907226563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,1,8,power_law_1.2,2.2952512741088866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,16,1,balanced,11.019983927408854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,16,1,balanced,11.221125284830729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,16,1,power_law_1.01,11.990220642089843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,16,1,power_law_1.01,12.04870376586914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,16,1,power_law_1.2,12.240550231933593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,16,1,power_law_1.2,12.367378997802735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,2,1,balanced,3.66268253326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,2,1,balanced,4.145242691040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,2,1,power_law_1.01,3.7211841583251952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,2,1,power_law_1.01,3.7406272888183594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,2,1,power_law_1.2,3.7443073272705076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,2,1,power_law_1.2,3.8280704498291014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,32,1,balanced,8.05070940653483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,32,1,balanced,8.082538604736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,32,1,power_law_1.01,8.297555541992187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,32,1,power_law_1.01,8.343142700195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,32,1,power_law_1.2,8.51475830078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,32,1,power_law_1.2,8.522937774658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,4,1,balanced,2.312373320261637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,4,1,balanced,2.3346239725748696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,4,1,power_law_1.01,2.358028793334961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,4,1,power_law_1.01,2.3671039581298827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,4,1,power_law_1.2,2.3985023498535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,4,1,power_law_1.2,2.40067195892334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,8,1,balanced,1.6376372973124187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,8,1,balanced,1.6443467140197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,8,1,power_law_1.01,1.6550399780273437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,8,1,power_law_1.01,1.6653568267822265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,8,1,power_law_1.2,1.6879232406616211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,4096,2688,22,512,8,1,power_law_1.2,1.6970880508422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,1,balanced,3.1140638987223306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,1,balanced,3.12880007425944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,1,power_law_1.01,3.0730815887451173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,1,power_law_1.01,3.109708786010742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,1,power_law_1.2,3.0398656845092775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,1,power_law_1.2,3.0592832565307617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,2,balanced,1.7603039741516113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,2,balanced,1.8070933024088542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,2,power_law_1.01,1.9814144134521485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,2,power_law_1.01,2.090496063232422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,2,power_law_1.2,2.088672065734863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,2,power_law_1.2,2.3567808151245115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,4,balanced,1.1332053343454997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,4,balanced,1.1521493593851726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,4,power_law_1.01,1.6105728149414062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,4,power_law_1.01,1.6573951721191407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,4,power_law_1.2,1.7700159072875976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,4,power_law_1.2,1.9809152603149414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,8,balanced,0.8943306605021158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,8,balanced,0.8952319622039795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,8,power_law_1.01,1.4554688453674316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,8,power_law_1.01,1.7246208190917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,8,power_law_1.2,1.5831487655639649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,1,8,power_law_1.2,1.7300352096557616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,16,1,balanced,0.3195679982503255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,16,1,balanced,0.32080533107121784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,16,1,power_law_1.01,0.3204031944274902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,16,1,power_law_1.01,0.3229248046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,16,1,power_law_1.2,0.3219712018966675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,16,1,power_law_1.2,0.32666239738464353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,2,1,balanced,1.5031147003173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,2,1,balanced,1.5164480209350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,2,1,power_law_1.01,1.5722111701965331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,2,1,power_law_1.01,1.593990421295166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,2,1,power_law_1.2,1.5713343620300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,2,1,power_law_1.2,1.5940352439880372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,32,1,balanced,0.23433067401250204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,32,1,balanced,0.2360693415006002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,32,1,power_law_1.01,0.24128639698028564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,32,1,power_law_1.01,0.24182400703430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,32,1,power_law_1.2,0.24057600498199463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,32,1,power_law_1.2,0.24174079895019532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,4,1,balanced,0.7957226435343424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,4,1,balanced,0.8082133134206136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,4,1,power_law_1.01,0.8429247856140136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,4,1,power_law_1.01,0.8598784446716309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,4,1,power_law_1.2,0.8338879585266114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,4,1,power_law_1.2,0.8570943832397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,8,1,balanced,0.4686346848805745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,8,1,balanced,0.47313066323598224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,8,1,power_law_1.01,0.4961599826812744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,8,1,power_law_1.01,0.5009664058685303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,8,1,power_law_1.2,0.497324800491333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,16384,2,8,8,1,power_law_1.2,0.49880318641662597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,1,balanced,2.4477759997049966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,1,balanced,2.4989493687947593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,1,power_law_1.01,3.0337024688720704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,1,power_law_1.01,3.1877824783325197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,1,power_law_1.2,3.2061439514160157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,1,power_law_1.2,3.2118526458740235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,128,balanced,0.637114683787028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,128,balanced,0.6373173395792643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,128,power_law_1.01,0.6772863864898682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,128,power_law_1.01,0.6855487823486328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,128,power_law_1.2,0.6993792057037354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,128,power_law_1.2,0.705676794052124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,16,balanced,0.7379946708679199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,16,balanced,0.7401173114776611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,16,power_law_1.01,0.8267135620117188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,16,power_law_1.01,0.8466239929199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,16,power_law_1.2,0.8826687812805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,16,power_law_1.2,0.9190079689025878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,2,balanced,1.542319933573405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,2,balanced,1.5599145889282227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,2,power_law_1.01,1.8941951751708985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,2,power_law_1.01,1.8978815078735352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,2,power_law_1.2,1.9791744232177735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,2,power_law_1.2,2.0108991622924806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,256,balanced,0.6308693488438925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,256,balanced,0.6320533355077108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,256,power_law_1.01,0.6655104160308838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,256,power_law_1.01,0.6655231952667237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,256,power_law_1.2,0.7000959873199463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,256,power_law_1.2,0.7019072055816651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,32,balanced,0.6788533528645834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,32,balanced,0.6802079677581787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,32,power_law_1.01,0.752294397354126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,32,power_law_1.01,0.755353593826294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,32,power_law_1.2,0.7716415882110595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,32,power_law_1.2,0.7991231918334961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,4,balanced,1.087989330291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,4,balanced,1.093664010365804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,4,power_law_1.01,1.2988415718078614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,4,power_law_1.01,1.329849624633789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,4,power_law_1.2,1.3594304084777833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,4,power_law_1.2,1.3740415573120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,64,balanced,0.6479413509368896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,64,balanced,0.6501546700795492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,64,power_law_1.01,0.7157695770263672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,64,power_law_1.01,0.7172160148620605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,64,power_law_1.2,0.7384448051452637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,64,power_law_1.2,0.7411263942718506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,8,balanced,0.8514026800791422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,8,balanced,0.8589066664377848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,8,power_law_1.01,1.0107968330383301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,8,power_law_1.01,1.0144319534301758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,8,power_law_1.2,1.0181568145751954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,1,8,power_law_1.2,1.0363200187683106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,16,1,balanced,0.5939786831537882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,16,1,balanced,0.5943306684494019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,16,1,power_law_1.01,0.7023104190826416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,16,1,power_law_1.01,0.7045631885528565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,16,1,power_law_1.2,0.7307583808898925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,16,1,power_law_1.2,0.7348415851593018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,2,1,balanced,1.394389311472575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,2,1,balanced,1.4128106435139973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,2,1,power_law_1.01,1.7458560943603516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,2,1,power_law_1.01,1.7779264450073242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,2,1,power_law_1.2,1.805504035949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,2,1,power_law_1.2,1.8059776306152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,32,1,balanced,0.5453973213831583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,32,1,balanced,0.5473973353703817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,32,1,power_law_1.01,0.6533567905426025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,32,1,power_law_1.01,0.6533631801605224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,32,1,power_law_1.2,0.6647039890289307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,32,1,power_law_1.2,0.6654848098754883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,4,1,balanced,0.9182506402333578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,4,1,balanced,0.9188480377197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,4,1,power_law_1.01,1.139571189880371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,4,1,power_law_1.01,1.1397760391235352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,4,1,power_law_1.2,1.16943359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,4,1,power_law_1.2,1.175648021697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,8,1,balanced,0.7074027061462402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,8,1,balanced,0.7093973159790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,8,1,power_law_1.01,0.8411711692810059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,8,1,power_law_1.01,0.8414912223815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,8,1,power_law_1.2,0.8729791641235352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2048,8,256,8,1,power_law_1.2,0.8730239868164062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,1,balanced,3.063546816507975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,1,balanced,3.118618647257487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,1,power_law_1.01,3.071059226989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,1,power_law_1.01,3.1440959930419923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,1,power_law_1.2,3.181715202331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,1,power_law_1.2,3.192889595031738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,16,balanced,0.7817440032958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,16,balanced,0.783578634262085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,16,power_law_1.01,0.8807616233825684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,16,power_law_1.01,0.8908927917480469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,16,power_law_1.2,0.9102848052978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,16,power_law_1.2,0.9428928375244141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,2,balanced,1.7644319534301758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,2,balanced,1.9098827044169109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,2,power_law_1.01,1.9051008224487305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,2,power_law_1.01,1.9768384933471679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,2,power_law_1.2,2.0349567413330076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,2,power_law_1.2,2.050841522216797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,32,balanced,0.7094346682230631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,32,balanced,0.7098453044891357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,32,power_law_1.01,0.8195263862609863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,32,power_law_1.01,0.8221695899963379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,32,power_law_1.2,0.8566399574279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,32,power_law_1.2,0.867795181274414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,4,balanced,1.201578696568807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,4,balanced,1.2064800262451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,4,power_law_1.01,1.3470720291137694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,4,power_law_1.01,1.3766976356506349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,4,power_law_1.2,1.4040127754211427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,4,power_law_1.2,1.4287232398986816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,8,balanced,0.9203680356343588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,8,balanced,0.9212533632914225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,8,power_law_1.01,1.035801601409912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,8,power_law_1.01,1.07708797454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,8,power_law_1.2,1.0761152267456056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,1,8,power_law_1.2,1.1090944290161133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,16,1,balanced,0.6686240037282308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,16,1,balanced,0.6706186930338541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,16,1,power_law_1.01,0.7013311862945557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,16,1,power_law_1.01,0.7026303768157959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,16,1,power_law_1.2,0.7064896106719971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,16,1,power_law_1.2,0.7082111835479736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,2,1,balanced,1.636672019958496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,2,1,balanced,1.689253330230713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,2,1,power_law_1.01,1.7350784301757813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,2,1,power_law_1.01,1.7714431762695313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,2,1,power_law_1.2,1.7836864471435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,2,1,power_law_1.2,1.7839616775512694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,32,1,balanced,0.6045920054117838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,32,1,balanced,0.6072479883829752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,32,1,power_law_1.01,0.631059217453003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,32,1,power_law_1.01,0.6326528072357178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,32,1,power_law_1.2,0.6366335868835449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,32,1,power_law_1.2,0.6382912158966064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,4,1,balanced,1.0474239985148113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,4,1,balanced,1.049887975056966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,4,1,power_law_1.01,1.1263680458068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,4,1,power_law_1.01,1.132646369934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,4,1,power_law_1.2,1.140620803833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,4,1,power_law_1.2,1.1456704139709473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,8,1,balanced,0.7731520334879557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,8,1,balanced,0.774720033009847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,8,1,power_law_1.01,0.8277183532714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,8,1,power_law_1.01,0.8337535858154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,8,1,power_law_1.2,0.8337663650512696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,6144,2560,8,160,8,1,power_law_1.2,0.8353664398193359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,1,balanced,2.860165278116862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,1,balanced,2.9191414515177407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,1,power_law_1.01,3.656768035888672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,1,power_law_1.01,3.6596351623535157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,1,power_law_1.2,3.6882686614990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,1,power_law_1.2,3.888896179199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,128,balanced,0.6965440114339193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,128,balanced,0.6990880171457926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,128,power_law_1.01,0.7470208168029785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,128,power_law_1.01,0.754201602935791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,128,power_law_1.2,0.7915328025817872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,128,power_law_1.2,0.7922048091888427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,16,balanced,0.8179893493652344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,16,balanced,0.8201546669006348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,16,power_law_1.01,0.9327872276306153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,16,power_law_1.01,0.9523903846740722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,16,power_law_1.2,0.950592041015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,16,power_law_1.2,0.981817626953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,2,balanced,1.7596267064412434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,2,balanced,1.7879947026570637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,2,power_law_1.01,2.200710487365723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,2,power_law_1.01,2.2030336380004885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,2,power_law_1.2,2.2416767120361327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,2,power_law_1.2,2.3301631927490236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,256,balanced,0.6918559869130453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,256,balanced,0.6941760381062826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,256,power_law_1.01,0.7296319961547851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,256,power_law_1.01,0.7321216106414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,256,power_law_1.2,0.7767936229705811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,256,power_law_1.2,0.7808512210845947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,32,balanced,0.7460107008616129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,32,balanced,0.7475039958953857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,32,power_law_1.01,0.8351039886474609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,32,power_law_1.01,0.8468223571777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,32,power_law_1.2,0.874118423461914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,32,power_law_1.2,0.874630355834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,4,balanced,1.2246452967325847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,4,balanced,1.2260959943135579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,4,power_law_1.01,1.4820799827575684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,4,power_law_1.01,1.4901056289672852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,4,power_law_1.2,1.5287551879882812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,4,power_law_1.2,1.5782143592834472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,64,balanced,0.7077066898345947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,64,balanced,0.712287982304891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,64,power_law_1.01,0.7876736164093018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,64,power_law_1.01,0.7989696025848388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,64,power_law_1.2,0.8399999618530274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,64,power_law_1.2,0.8508864402770996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,8,balanced,0.9525813261667887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,8,balanced,0.9542400042215983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,8,power_law_1.01,1.0870207786560058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,8,power_law_1.01,1.137235164642334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,8,power_law_1.2,1.1899200439453126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,1,8,power_law_1.2,1.2157119750976562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,16,1,balanced,0.6776213645935059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,16,1,balanced,0.6793546676635742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,16,1,power_law_1.01,0.7993535995483398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,16,1,power_law_1.01,0.8040127754211426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,16,1,power_law_1.2,0.8349311828613282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,16,1,power_law_1.2,0.8396927833557128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,2,1,balanced,1.6260746320088704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,2,1,balanced,1.6341066360473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,2,1,power_law_1.01,2.0169088363647463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,2,1,power_law_1.01,2.0234880447387695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,2,1,power_law_1.2,2.079232025146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,2,1,power_law_1.2,2.0888320922851564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,32,1,balanced,0.6242026487986246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,32,1,balanced,0.6244853337605795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,32,1,power_law_1.01,0.7448063850402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,32,1,power_law_1.01,0.7464064121246338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,32,1,power_law_1.2,0.7597631931304931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,32,1,power_law_1.2,0.7606656074523925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,4,1,balanced,1.054474671681722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,4,1,balanced,1.0548373063405354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,4,1,power_law_1.01,1.3124799728393555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,4,1,power_law_1.01,1.3134016036987304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,4,1,power_law_1.2,1.3435903549194337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,4,1,power_law_1.2,1.3494720458984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,8,1,balanced,0.8144746621449789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,8,1,balanced,0.8145386377970377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,8,1,power_law_1.01,0.9661439895629883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,8,1,power_law_1.01,0.9857024192810059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,8,1,power_law_1.2,0.9983488082885742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,256,8,1,power_law_1.2,1.000972843170166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,1,balanced,3.936917304992676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,1,balanced,3.9815308252970376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,1,power_law_1.01,4.536563110351563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,1,power_law_1.01,4.614278411865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,1,power_law_1.2,4.7210430145263675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,1,power_law_1.2,4.735846328735351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,128,balanced,0.7606186866760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,128,balanced,0.760645310084025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,128,power_law_1.01,0.8039039611816406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,128,power_law_1.01,0.8072704315185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,128,power_law_1.2,0.8256319999694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,128,power_law_1.2,0.8287487983703613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,16,balanced,0.933024009068807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,16,balanced,0.9341333707173666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,16,power_law_1.01,1.0122048377990722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,16,power_law_1.01,1.0303615570068358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,16,power_law_1.2,1.0639167785644532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,16,power_law_1.2,1.0819904327392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,2,balanced,2.34715207417806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,2,balanced,2.3830453554789224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,2,power_law_1.01,2.5600767135620117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,2,power_law_1.01,2.5701696395874025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,2,power_law_1.2,2.766342353820801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,2,power_law_1.2,2.773664093017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,32,balanced,0.8366986910502116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,32,balanced,0.8380853335062662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,32,power_law_1.01,0.9047231674194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,32,power_law_1.01,0.9163392066955567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,32,power_law_1.2,0.9342975616455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,32,power_law_1.2,0.9377280235290527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,4,balanced,1.5167627334594727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,4,balanced,1.5181652704874675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,4,power_law_1.01,1.6905792236328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,4,power_law_1.01,1.707097625732422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,4,power_law_1.2,1.779520034790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,4,power_law_1.2,1.7836992263793945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,64,balanced,0.7825866540273031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,64,balanced,0.7863787015279134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,64,power_law_1.01,0.8367168426513671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,64,power_law_1.01,0.8440959930419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,64,power_law_1.2,0.8678655624389648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,64,power_law_1.2,0.877017593383789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,8,balanced,1.1355253060658772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,8,balanced,1.1397813161214192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,8,power_law_1.01,1.2141887664794921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,8,power_law_1.01,1.2615872383117677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,8,power_law_1.2,1.3015616416931153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,1,8,power_law_1.2,1.3251263618469238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,16,1,balanced,0.8400320212046305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,16,1,balanced,0.8413706620534261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,16,1,power_law_1.01,0.9283647537231445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,16,1,power_law_1.01,0.9306176185607911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,16,1,power_law_1.2,0.9515199661254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,16,1,power_law_1.2,0.9589887619018554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,2,1,balanced,2.162607987721761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,2,1,balanced,2.3095253308614097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,2,1,power_law_1.01,2.440902328491211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,2,1,power_law_1.01,2.4674816131591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,2,1,power_law_1.2,2.5430463790893554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,2,1,power_law_1.2,2.5724416732788087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,32,1,balanced,0.7770240306854248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,32,1,balanced,0.7775253454844157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,32,1,power_law_1.01,0.8364800453186035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,32,1,power_law_1.01,0.8386879920959472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,32,1,power_law_1.2,0.8594367980957032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,32,1,power_law_1.2,0.8654784202575684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,4,1,balanced,1.3732585906982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,4,1,balanced,1.3791839281717937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,4,1,power_law_1.01,1.5378687858581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,4,1,power_law_1.01,1.5472384452819825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,4,1,power_law_1.2,1.6185407638549805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,4,1,power_law_1.2,1.6212287902832032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,8,1,balanced,1.029034694035848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,8,1,balanced,1.0291253725687664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,8,1,power_law_1.01,1.1295231819152831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,8,1,power_law_1.01,1.132595157623291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,8,1,power_law_1.2,1.1753664016723633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,4096,7168,2048,8,384,8,1,power_law_1.2,1.178444766998291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,1,balanced,0.15146133303642273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,1,balanced,0.15226667126019797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,1,power_law_1.01,0.13751039505004883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,1,power_law_1.01,0.1378175973892212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,1,power_law_1.2,0.13738880157470704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,1,power_law_1.2,0.13916800022125245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,128,balanced,0.03257599969704946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,128,balanced,0.03348266581694285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,128,power_law_1.01,0.031948798894882204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,128,power_law_1.01,0.03311359882354736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,128,power_law_1.2,0.031481599807739256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,128,power_law_1.2,0.03189760148525238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,16,balanced,0.03931200007597605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,16,balanced,0.039808000127474465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,16,power_law_1.01,0.03770880103111267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,16,power_law_1.01,0.0380160003900528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,16,power_law_1.2,0.03689599931240082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,16,power_law_1.2,0.038176000118255615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,2,balanced,0.09723732868830363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,2,balanced,0.09777599573135376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,2,power_law_1.01,0.09025920033454896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,2,power_law_1.01,0.09045119881629944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,2,power_law_1.2,0.08814079761505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,2,power_law_1.2,0.09133440256118774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,32,balanced,0.03528533379236857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,32,balanced,0.03561066587766012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,32,power_law_1.01,0.03351680040359497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,32,power_law_1.01,0.03391999900341034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,32,power_law_1.2,0.03349120020866394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,32,power_law_1.2,0.03408640027046204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,4,balanced,0.06640000144640605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,4,balanced,0.06835733354091644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,4,power_law_1.01,0.06459519863128663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,4,power_law_1.01,0.06639360189437866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,4,power_law_1.2,0.06438400149345398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,4,power_law_1.2,0.06469119787216186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,64,balanced,0.03332266708215078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,64,balanced,0.033557333052158356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,64,power_law_1.01,0.032332798838615416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,64,power_law_1.01,0.03243519961833954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,64,power_law_1.2,0.0323199987411499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,64,power_law_1.2,0.032652801275253295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,8,balanced,0.047914668917655945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,8,balanced,0.0513919989267985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,8,power_law_1.01,0.04485760033130646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,8,power_law_1.01,0.04510720074176788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,8,power_law_1.2,0.04490880072116852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,1,8,power_law_1.2,0.04688639938831329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,2,1,balanced,0.09913600484530131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,2,1,balanced,0.0997226635615031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,2,1,power_law_1.01,0.0901311993598938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,2,1,power_law_1.01,0.09015679955482483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,2,1,power_law_1.2,0.09059839844703674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,2,1,power_law_1.2,0.09093120098114013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,4,1,balanced,0.07252266506354015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,4,1,balanced,0.0749013324578603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,4,1,power_law_1.01,0.06871680021286011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,4,1,power_law_1.01,0.07004799842834472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,4,1,power_law_1.2,0.06876800060272217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2048,768,8,128,4,1,power_law_1.2,0.06993280053138733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,1,balanced,0.3853120009104411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,1,balanced,0.3854186534881592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,1,power_law_1.01,0.3175168037414551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,1,power_law_1.01,0.32094080448150636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,1,power_law_1.2,0.3208575963973999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,1,power_law_1.2,0.32293760776519775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,128,balanced,0.03973866750796636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,128,balanced,0.03982399900754293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,128,power_law_1.01,0.03818239867687225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,128,power_law_1.01,0.0383103996515274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,128,power_law_1.2,0.038073599338531494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,128,power_law_1.2,0.03852800130844116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,16,balanced,0.06594133377075195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,16,balanced,0.0665280024210612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,16,power_law_1.01,0.06241919994354248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,16,power_law_1.01,0.06399999856948853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,16,power_law_1.2,0.06173440217971802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,16,power_law_1.2,0.06286079883575439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,2,balanced,0.21795733769734701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,2,balanced,0.21821333964665732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,2,power_law_1.01,0.19045120477676392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,2,power_law_1.01,0.19136639833450317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,2,power_law_1.2,0.18019839525222778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,2,power_law_1.2,0.19738240242004396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,32,balanced,0.045850664377212524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,32,balanced,0.047914668917655945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,32,power_law_1.01,0.04579200148582459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,32,power_law_1.01,0.045900800824165346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,32,power_law_1.2,0.04585599899291992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,32,power_law_1.2,0.04602240025997162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,4,balanced,0.1328159968058268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,4,balanced,0.13302933176358542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,4,power_law_1.01,0.1155392050743103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,4,power_law_1.01,0.1195520043373108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,4,power_law_1.2,0.11918079853057861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,4,power_law_1.2,0.12198400497436523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,64,balanced,0.04191466669241587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,64,balanced,0.043866669138272606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,64,power_law_1.01,0.04139519929885864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,64,power_law_1.01,0.04224640130996704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,64,power_law_1.2,0.04222719967365265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,64,power_law_1.2,0.04224640130996704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,8,balanced,0.09096533060073853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,8,balanced,0.09284800291061401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,8,power_law_1.01,0.08019199967384338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,8,power_law_1.01,0.08203520178794861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,8,power_law_1.2,0.08104320168495179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,1,8,power_law_1.2,0.08268160223960877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,16,1,balanced,0.24090667565663657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,16,1,balanced,0.2430186669031779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,16,1,power_law_1.01,0.19586559534072875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,16,1,power_law_1.01,0.21075839996337892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,16,1,power_law_1.2,0.20071039199829102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,16,1,power_law_1.2,0.2032831907272339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,2,1,balanced,0.22311466932296753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,2,1,balanced,0.2245546579360962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,2,1,power_law_1.01,0.1853824019432068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,2,1,power_law_1.01,0.1876479983329773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,2,1,power_law_1.2,0.1818943977355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,2,1,power_law_1.2,0.19018880128860474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,32,1,balanced,0.21647467215855917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,32,1,balanced,0.2166666587193807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,32,1,power_law_1.01,0.18076800107955932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,32,1,power_law_1.01,0.18859519958496093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,32,1,power_law_1.2,0.1759552001953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,32,1,power_law_1.2,0.18444160223007203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,4,1,balanced,0.1381333371003469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,4,1,balanced,0.13934933145840964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,4,1,power_law_1.01,0.11605759859085082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,4,1,power_law_1.01,0.11847679615020752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,4,1,power_law_1.2,0.11590399742126464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,4,1,power_law_1.2,0.11755520105361938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,8,1,balanced,0.3014666636784871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,8,1,balanced,0.3029279907544454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,8,1,power_law_1.01,0.2458751916885376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,8,1,power_law_1.01,0.24673919677734374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,8,1,power_law_1.2,0.24707839488983155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,2688,1856,6,128,8,1,power_law_1.2,0.24709761142730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,1,balanced,0.6849119663238525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,1,balanced,0.9531359672546387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,1,power_law_1.01,0.5052800178527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,1,power_law_1.01,0.5070720195770264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,1,power_law_1.2,0.490777587890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,1,power_law_1.2,0.4992959976196289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,128,balanced,0.04368533194065094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,128,balanced,0.04384533564249674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,128,power_law_1.01,0.04049279987812042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,128,power_law_1.01,0.040550398826599124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,128,power_law_1.2,0.040934398770332336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,128,power_law_1.2,0.04100480079650879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,16,balanced,0.08534933129946391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,16,balanced,0.08681066830952962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,16,power_law_1.01,0.07899519801139832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,16,power_law_1.01,0.0818943977355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,16,power_law_1.2,0.07880319952964783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,16,power_law_1.2,0.08076800107955932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,2,balanced,0.38027199109395343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,2,balanced,0.38364267349243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,2,power_law_1.01,0.2817280054092407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,2,power_law_1.01,0.29687678813934326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,2,power_law_1.2,0.27102079391479494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,2,power_law_1.2,0.2763711929321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,256,balanced,0.03953066716591517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,256,balanced,0.04159999887148539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,256,power_law_1.01,0.03904640078544617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,256,power_law_1.01,0.039315199851989745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,256,power_law_1.2,0.03891839981079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,256,power_law_1.2,0.03911679983139038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,32,balanced,0.06865066786607106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,32,balanced,0.06949333349863689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,32,power_law_1.01,0.058976000547409056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,32,power_law_1.01,0.0634112000465393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,32,power_law_1.2,0.062028801441192626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,32,power_law_1.2,0.06387199759483338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,4,balanced,0.20652800798416138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,4,balanced,0.21091733376185098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,4,power_law_1.01,0.15806080102920533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,4,power_law_1.01,0.1801599979400635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,4,power_law_1.2,0.16993919610977173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,4,power_law_1.2,0.1950271964073181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,64,balanced,0.047930667797724404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,64,balanced,0.04984533290068308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,64,power_law_1.01,0.04661119878292084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,64,power_law_1.01,0.04748159945011139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,64,power_law_1.2,0.04670720100402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,64,power_law_1.2,0.047142401337623596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,8,balanced,0.12834133704503378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,8,balanced,0.12872533003489176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,8,power_law_1.01,0.1099392056465149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,8,power_law_1.01,0.11312639713287354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,8,power_law_1.2,0.10807679891586304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,1,8,power_law_1.2,0.11273599863052368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,16,1,balanced,0.11137066284815471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,16,1,balanced,0.11231467127799988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,16,1,power_law_1.01,0.09075199961662292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,16,1,power_law_1.01,0.09224960207939148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,16,1,power_law_1.2,0.09040639996528625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,16,1,power_law_1.2,0.09121919870376587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,2,1,balanced,0.3761013348897298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,2,1,balanced,0.37618664900461835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,2,1,power_law_1.01,0.2773504018783569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,2,1,power_law_1.01,0.2809664011001587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,2,1,power_law_1.2,0.2742271900177002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,2,1,power_law_1.2,0.2754816055297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,32,1,balanced,0.10002666711807251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,32,1,balanced,0.10108799735705058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,32,1,power_law_1.01,0.07822719812393189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,32,1,power_law_1.01,0.07889919877052307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,32,1,power_law_1.2,0.07824000120162963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,32,1,power_law_1.2,0.07897599935531616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,4,1,balanced,0.22234666347503662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,4,1,balanced,0.2294879953066508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,4,1,power_law_1.01,0.16782079935073851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,4,1,power_law_1.01,0.17153279781341552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,4,1,power_law_1.2,0.16739840507507325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,4,1,power_law_1.2,0.16853760480880736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,8,1,balanced,0.155648003021876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,8,1,balanced,0.1557919979095459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,8,1,power_law_1.01,0.12168960571289063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,8,1,power_law_1.01,0.12258559465408325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,8,1,power_law_1.2,0.11937919855117798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,3072,1536,8,256,8,1,power_law_1.2,0.12165119647979736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,1,balanced,0.3083733320236206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,1,balanced,0.308405339717865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,1,power_law_1.01,0.31989760398864747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,1,power_law_1.01,0.3290623903274536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,1,power_law_1.2,0.3272576093673706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,1,power_law_1.2,0.3358975887298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,2,balanced,0.22105065981547037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,2,balanced,0.22721066077550253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,2,power_law_1.01,0.2055232048034668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,2,power_law_1.01,0.20597760677337645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,2,power_law_1.2,0.21047039031982423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,2,power_law_1.2,0.2155456066131592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,4,balanced,0.15428266922632852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,4,balanced,0.1606559952100118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,4,power_law_1.01,0.15649280548095704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,4,power_law_1.01,0.15986560583114623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,4,power_law_1.2,0.1603008031845093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,4,power_law_1.2,0.1628864049911499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,8,balanced,0.12155733505884807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,8,balanced,0.12627200285593668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,8,power_law_1.01,0.12023040056228637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,8,power_law_1.01,0.13352320194244385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,8,power_law_1.2,0.13730560541152953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,1,8,power_law_1.2,0.14085760116577148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,16,1,balanced,0.046112000942230225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,16,1,balanced,0.04774933556715647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,16,1,power_law_1.01,0.047417598962783816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,16,1,power_law_1.01,0.04973439872264862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,16,1,power_law_1.2,0.04780800044536591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,16,1,power_law_1.2,0.04959999918937683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,2,1,balanced,0.18815465768178305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,2,1,balanced,0.21567465861638388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,2,1,power_law_1.01,0.18029439449310303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,2,1,power_law_1.01,0.1837183952331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,2,1,power_law_1.2,0.17176320552825927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,2,1,power_law_1.2,0.18192000389099122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,32,1,balanced,0.035631999373435974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,32,1,balanced,0.03734400123357773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,32,1,power_law_1.01,0.034790399670600894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,32,1,power_law_1.01,0.0348800003528595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,32,1,power_law_1.2,0.035174399614334106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,32,1,power_law_1.2,0.035411199927330016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,4,1,balanced,0.10754133264223735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,4,1,balanced,0.10847466190656026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,4,1,power_law_1.01,0.10497920513153076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,4,1,power_law_1.01,0.10616320371627808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,4,1,power_law_1.2,0.10574719905853272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,4,1,power_law_1.2,0.10845439434051514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,8,1,balanced,0.07378133138020833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,8,1,balanced,0.07454933226108551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,8,1,power_law_1.01,0.06872959733009339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,8,1,power_law_1.01,0.071424001455307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,8,1,power_law_1.2,0.06963199973106385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,14336,2,8,8,1,power_law_1.2,0.07032319903373718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,1,balanced,0.46933865547180176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,1,balanced,0.4704373280207316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,1,power_law_1.01,0.413804817199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,1,power_law_1.01,0.4182464122772217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,1,power_law_1.2,0.41612801551818845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,1,power_law_1.2,0.41867518424987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,128,balanced,0.041450666884581246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,128,balanced,0.04180799921353658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,128,power_law_1.01,0.04110080003738403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,128,power_law_1.01,0.04200319945812225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,128,power_law_1.2,0.040652799606323245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,128,power_law_1.2,0.041484799981117246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,16,balanced,0.07858666777610779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,16,balanced,0.07902400195598602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,16,power_law_1.01,0.07349119782447815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,16,power_law_1.01,0.07365760207176208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,16,power_law_1.2,0.07322880029678344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,16,power_law_1.2,0.07354879975318909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,2,balanced,0.2593013246854146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,2,balanced,0.25939732789993286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,2,power_law_1.01,0.23015038967132567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,2,power_law_1.01,0.2370431900024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,2,power_law_1.2,0.23096959590911864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,2,power_law_1.2,0.24324479103088378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,32,balanced,0.05376533170541128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,32,balanced,0.054154664278030396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,32,power_law_1.01,0.05259519815444946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,32,power_law_1.01,0.05397760272026062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,32,power_law_1.2,0.051648002862930295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,32,power_law_1.2,0.05211520195007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,4,balanced,0.15553067127863565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,4,balanced,0.15707199772198996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,4,power_law_1.01,0.1388543963432312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,4,power_law_1.01,0.14419200420379638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,4,power_law_1.2,0.1421504020690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,4,power_law_1.2,0.14303359985351563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,64,balanced,0.0455626646677653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,64,balanced,0.045797333121299744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,64,power_law_1.01,0.0433023989200592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,64,power_law_1.01,0.04371199905872345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,64,power_law_1.2,0.04283519983291626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,64,power_law_1.2,0.043833601474761966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,8,balanced,0.1009386678536733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,8,balanced,0.10122666756312053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,8,power_law_1.01,0.09812480211257935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,8,power_law_1.01,0.09831680059432983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,8,power_law_1.2,0.09413759708404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,1,8,power_law_1.2,0.09651200175285339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,16,1,balanced,0.08619200189908345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,16,1,balanced,0.08754133184750874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,16,1,power_law_1.01,0.08001919984817504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,16,1,power_law_1.01,0.08058879971504211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,16,1,power_law_1.2,0.08083840012550354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,16,1,power_law_1.2,0.08135039806365967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,2,1,balanced,0.2642880082130432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,2,1,balanced,0.2648213307062785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,2,1,power_law_1.01,0.2331007957458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,2,1,power_law_1.01,0.23359999656677247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,2,1,power_law_1.2,0.23474559783935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,2,1,power_law_1.2,0.2360383987426758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,32,1,balanced,0.07296533385912578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,32,1,balanced,0.07387199997901917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,32,1,power_law_1.01,0.06852480173110961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,32,1,power_law_1.01,0.06883199810981751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,32,1,power_law_1.2,0.06928640007972717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,32,1,power_law_1.2,0.0695360004901886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,4,1,balanced,0.16309866309165955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,4,1,balanced,0.1637333333492279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,4,1,power_law_1.01,0.14663679599761964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,4,1,power_law_1.01,0.14773759841918946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,4,1,power_law_1.2,0.14517120122909546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,4,1,power_law_1.2,0.14714239835739135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,8,1,balanced,0.11578133702278137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,8,1,balanced,0.11643733580907185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,8,1,power_law_1.01,0.1081279993057251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,8,1,power_law_1.01,0.10849920511245728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,8,1,power_law_1.2,0.10639359951019287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,1536,8,128,8,1,power_law_1.2,0.10932480096817017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,1,balanced,2.969349225362142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,1,balanced,2.973439852396647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,1,power_law_1.01,2.3566848754882814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,1,power_law_1.01,2.362918472290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,1,power_law_1.2,2.3427839279174805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,1,power_law_1.2,2.382111930847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,128,balanced,0.09893332918485005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,128,balanced,0.09940800070762634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,128,power_law_1.01,0.09605759978294373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,128,power_law_1.01,0.09755520224571228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,128,power_law_1.2,0.09550079703330994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,128,power_law_1.2,0.09777920246124268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,16,balanced,0.2645653287569682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,16,balanced,0.26496533552805585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,16,power_law_1.01,0.23629438877105713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,16,power_law_1.01,0.24229118824005128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,16,power_law_1.2,0.23697919845581056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,16,power_law_1.2,0.24191360473632811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,2,balanced,1.5238080024719238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,2,balanced,1.5245812733968098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,2,power_law_1.01,1.2573439598083496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,2,power_law_1.01,1.271571159362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,2,power_law_1.2,1.2468992233276368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,2,power_law_1.2,1.2783935546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,256,balanced,0.08304533362388611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,256,balanced,0.08474133412043254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,256,power_law_1.01,0.08127359747886657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,256,power_law_1.01,0.0825215995311737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,256,power_law_1.2,0.08030080199241638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,256,power_law_1.2,0.080595201253891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,32,balanced,0.1732213298479716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,32,balanced,0.1738719940185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,32,power_law_1.01,0.15941760540008545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,32,power_law_1.01,0.16195839643478394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,32,power_law_1.2,0.16005760431289673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,32,power_law_1.2,0.16210559606552125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,4,balanced,0.8037013212839762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,4,balanced,0.8037652969360352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,4,power_law_1.01,0.671724796295166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,4,power_law_1.01,0.6837056159973145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,4,power_law_1.2,0.7001920223236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,4,power_law_1.2,0.7172863960266114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,64,balanced,0.12417067090670268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,64,balanced,0.12570666273434958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,64,power_law_1.01,0.11628160476684571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,64,power_law_1.01,0.1194815993309021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,64,power_law_1.2,0.11498880386352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,64,power_law_1.2,0.1189120054244995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,8,balanced,0.44314666589101154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,8,balanced,0.44413332144419354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,8,power_law_1.01,0.393939208984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,8,power_law_1.01,0.4178880214691162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,8,power_law_1.2,0.36583681106567384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,1,8,power_law_1.2,0.4300032138824463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,16,1,balanced,1.586858590443929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,16,1,balanced,1.5900640487670898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,16,1,power_law_1.01,1.2654848098754883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,16,1,power_law_1.01,1.2807744026184082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,16,1,power_law_1.2,1.2582592010498046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,16,1,power_law_1.2,1.2802687644958497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,2,1,balanced,1.569973309834798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,2,1,balanced,1.6028213500976562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,2,1,power_law_1.01,1.2441344261169434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,2,1,power_law_1.01,1.2478976249694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,2,1,power_law_1.2,1.234931182861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,2,1,power_law_1.2,1.235091209411621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,32,1,balanced,1.2581760088602703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,32,1,balanced,1.2582613627115886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,32,1,power_law_1.01,1.0117695808410645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,32,1,power_law_1.01,1.0156991958618165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,32,1,power_law_1.2,1.0040767669677735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,32,1,power_law_1.2,1.006105613708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,4,1,balanced,0.8703359762827555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,4,1,balanced,0.871018648147583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,4,1,power_law_1.01,0.6994239807128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,4,1,power_law_1.01,0.701478385925293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,4,1,power_law_1.2,0.6983488082885743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,4,1,power_law_1.2,0.6994431972503662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,8,1,balanced,0.5134026606877645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,8,1,balanced,0.5336000124613444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,8,1,power_law_1.01,0.4132351875305176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,8,1,power_law_1.01,0.41541762351989747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,8,1,power_law_1.2,0.40792322158813477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,4096,2688,22,512,8,1,power_law_1.2,0.4085247993469238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,1,balanced,0.48816001415252686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,1,balanced,0.4945066769917806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,1,power_law_1.01,0.5034239768981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,1,power_law_1.01,0.5045951843261719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,1,power_law_1.2,0.4869696140289307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,1,power_law_1.2,0.5114240169525146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,2,balanced,0.30844799677530926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,2,balanced,0.3274773359298706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,2,power_law_1.01,0.3241600036621094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,2,power_law_1.01,0.3256256103515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,2,power_law_1.2,0.31415040493011476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,2,power_law_1.2,0.3258879899978638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,4,balanced,0.2178879976272583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,4,balanced,0.21993066867192587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,4,power_law_1.01,0.20257279872894288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,4,power_law_1.01,0.21440000534057618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,4,power_law_1.2,0.21699841022491456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,4,power_law_1.2,0.2181567907333374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,8,balanced,0.1591253379980723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,8,balanced,0.1607093314329783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,8,power_law_1.01,0.16903040409088135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,8,power_law_1.01,0.17634559869766236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,8,power_law_1.2,0.1690111994743347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,1,8,power_law_1.2,0.16992000341415406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,16,1,balanced,0.07047999898592631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,16,1,balanced,0.07239999870459239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,16,1,power_law_1.01,0.06819199919700622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,16,1,power_law_1.01,0.07054719924926758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,16,1,power_law_1.2,0.0707584023475647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,16,1,power_law_1.2,0.07343360185623168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,2,1,balanced,0.26950399080912274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,2,1,balanced,0.2937120000521342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,2,1,power_law_1.01,0.27050879001617434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,2,1,power_law_1.01,0.27871999740600584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,2,1,power_law_1.2,0.2671168088912964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,2,1,power_law_1.2,0.28999040126800535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,32,1,balanced,0.045834665497144066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,32,1,balanced,0.04774933556715647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,32,1,power_law_1.01,0.04643200039863586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,32,1,power_law_1.01,0.05296639800071716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,32,1,power_law_1.2,0.0482367992401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,32,1,power_law_1.2,0.04881280064582825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,4,1,balanced,0.1590986649195353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,4,1,balanced,0.19637332359949747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,4,1,power_law_1.01,0.1584831953048706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,4,1,power_law_1.01,0.15854079723358155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,4,1,power_law_1.2,0.16105600595474243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,4,1,power_law_1.2,0.1710271954536438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,8,1,balanced,0.10597866773605347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,8,1,balanced,0.11211733023325603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,8,1,power_law_1.01,0.09520000219345093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,8,1,power_law_1.01,0.09562240242958069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,8,1,power_law_1.2,0.09624320268630981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,16384,2,8,8,1,power_law_1.2,0.09899520277976989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,1,balanced,1.7334720293680828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,1,balanced,1.816805362701416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,1,power_law_1.01,1.233523178100586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,1,power_law_1.01,1.2639039993286132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,1,power_law_1.2,1.2333248138427735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,1,power_law_1.2,1.2430784225463867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,128,balanced,0.06606400012969971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,128,balanced,0.06704000135262807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,128,power_law_1.01,0.06652160286903382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,128,power_law_1.01,0.0667136013507843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,128,power_law_1.2,0.066348797082901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,128,power_law_1.2,0.06739839911460876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,16,balanced,0.16966400543848673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,16,balanced,0.17087467511494955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,16,power_law_1.01,0.145305597782135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,16,power_law_1.01,0.14565119743347169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,16,power_law_1.2,0.1351359963417053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,16,power_law_1.2,0.140556800365448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,2,balanced,0.8976426919301351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,2,balanced,0.9062986373901367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,2,power_law_1.01,0.6831424236297607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,2,power_law_1.01,0.6915840148925781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,2,power_law_1.2,0.6390079975128173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,2,power_law_1.2,0.703443193435669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,256,balanced,0.056128000219662987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,256,balanced,0.05782933533191681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,256,power_law_1.01,0.0551360011100769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,256,power_law_1.01,0.05585920214653015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,256,power_law_1.2,0.05553280115127564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,256,power_law_1.2,0.05583999752998352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,32,balanced,0.11718400319417317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,32,balanced,0.11743999520937602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,32,power_law_1.01,0.10581120252609252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,32,power_law_1.01,0.10720000267028809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,32,power_law_1.2,0.10229760408401489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,32,power_law_1.2,0.10773760080337524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,4,balanced,0.47381333510080975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,4,balanced,0.4901546637217204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,4,power_law_1.01,0.3589567899703979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,4,power_law_1.01,0.40694398880004884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,4,power_law_1.2,0.3654720067977905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,4,power_law_1.2,0.41841278076171873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,64,balanced,0.0885653297106425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,64,balanced,0.08892266949017842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,64,power_law_1.01,0.08489599823951721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,64,power_law_1.01,0.0871999979019165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,64,power_law_1.2,0.08057600259780884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,64,power_law_1.2,0.08300799727439881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,8,balanced,0.2707466681798299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,8,balanced,0.271013339360555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,8,power_law_1.01,0.24895360469818115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,8,power_law_1.01,0.26512000560760496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,8,power_law_1.2,0.2282111883163452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,1,8,power_law_1.2,0.23501439094543458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,16,1,balanced,0.21349332729975382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,16,1,balanced,0.21517332394917807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,16,1,power_law_1.01,0.16257280111312866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,16,1,power_law_1.01,0.16302080154418946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,16,1,power_law_1.2,0.1619968056678772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,16,1,power_law_1.2,0.163372802734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,2,1,balanced,0.9177760283152262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,2,1,balanced,0.9181439876556396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,2,1,power_law_1.01,0.666156816482544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,2,1,power_law_1.01,0.6703104019165039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,2,1,power_law_1.2,0.662559986114502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,2,1,power_law_1.2,0.668236780166626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,32,1,balanced,0.1713493267695109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,32,1,balanced,0.17197332779566446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,32,1,power_law_1.01,0.13738240003585817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,32,1,power_law_1.01,0.13831039667129516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,32,1,power_law_1.2,0.135481595993042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,32,1,power_law_1.2,0.13674880266189576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,4,1,balanced,0.5103520154953003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,4,1,balanced,0.5112799803415934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,4,1,power_law_1.01,0.38099839687347414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,4,1,power_law_1.01,0.3819967985153198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,4,1,power_law_1.2,0.37306239604949953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,4,1,power_law_1.2,0.37742080688476565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,8,1,balanced,0.3120800058046977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,8,1,balanced,0.3129013379414876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,8,1,power_law_1.01,0.2358720064163208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,8,1,power_law_1.01,0.24174718856811522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,8,1,power_law_1.2,0.22951040267944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2048,8,256,8,1,power_law_1.2,0.23185279369354247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,1,balanced,1.3581387201944988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,1,balanced,1.398047924041748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,1,power_law_1.01,1.1081024169921876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,1,power_law_1.01,1.1263296127319335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,1,power_law_1.2,1.107603168487549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,1,power_law_1.2,1.1328319549560546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,16,balanced,0.1378506620724996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,16,balanced,0.1388053297996521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,16,power_law_1.01,0.12928639650344848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,16,power_law_1.01,0.13171839714050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,16,power_law_1.2,0.13193600177764891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,16,power_law_1.2,0.13257600069046022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,2,balanced,0.7091946601867676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,2,balanced,0.7120107014973959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,2,power_law_1.01,0.6023168087005615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,2,power_law_1.01,0.6049215793609619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,2,power_law_1.2,0.5846784114837646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,2,power_law_1.2,0.5854015827178956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,32,balanced,0.0990613301595052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,32,balanced,0.09917866190274556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,32,power_law_1.01,0.0950655996799469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,32,power_law_1.01,0.09617279767990113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,32,power_law_1.2,0.09303039908409119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,32,power_law_1.2,0.09446399807929992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,4,balanced,0.37928001085917157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,4,balanced,0.43900267283121747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,4,power_law_1.01,0.3513024091720581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,4,power_law_1.01,0.3543616056442261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,4,power_law_1.2,0.32444798946380615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,4,power_law_1.2,0.350816011428833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,8,balanced,0.21495999892552695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,8,balanced,0.2164799968401591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,8,power_law_1.01,0.19897600412368774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,8,power_law_1.01,0.20659201145172118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,8,power_law_1.2,0.17994240522384644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,1,8,power_law_1.2,0.19041919708251953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,16,1,balanced,0.17679466803868613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,16,1,balanced,0.17681600650151572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,16,1,power_law_1.01,0.1547327995300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,16,1,power_law_1.01,0.1570304036140442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,16,1,power_law_1.2,0.15387519598007202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,16,1,power_law_1.2,0.15673600435256957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,2,1,balanced,0.7205386956532797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,2,1,balanced,0.7210079828898112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,2,1,power_law_1.01,0.5974080085754394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,2,1,power_law_1.01,0.6053184032440185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,2,1,power_law_1.2,0.6033535957336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,2,1,power_law_1.2,0.6085887908935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,32,1,balanced,0.13529066244761148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,32,1,balanced,0.1362666686375936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,32,1,power_law_1.01,0.11750400066375732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,32,1,power_law_1.01,0.11767040491104126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,32,1,power_law_1.2,0.11615999937057495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,32,1,power_law_1.2,0.11653759479522705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,4,1,balanced,0.398037314414978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,4,1,balanced,0.39899198214213055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,4,1,power_law_1.01,0.33688960075378416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,4,1,power_law_1.01,0.33714559078216555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,4,1,power_law_1.2,0.33628799915313723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,4,1,power_law_1.2,0.3382719993591309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,8,1,balanced,0.24897066752115884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,8,1,balanced,0.2529066602389018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,8,1,power_law_1.01,0.21200640201568605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,8,1,power_law_1.01,0.21638400554656984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,8,1,power_law_1.2,0.21304960250854493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,6144,2560,8,160,8,1,power_law_1.2,0.22117118835449218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,1,balanced,2.0064266522725425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,1,balanced,2.0099892616271973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,1,power_law_1.01,1.4623680114746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,1,power_law_1.01,1.4774335861206054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,1,power_law_1.2,1.4547776222229003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,1,power_law_1.2,1.4554112434387207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,128,balanced,0.07789333164691925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,128,balanced,0.08019733428955078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,128,power_law_1.01,0.0771776020526886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,128,power_law_1.01,0.07776640057563781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,128,power_law_1.2,0.07923200130462646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,128,power_law_1.2,0.07985280156135559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,16,balanced,0.19236266613006592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,16,balanced,0.193066676457723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,16,power_law_1.01,0.16904959678649903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,16,power_law_1.01,0.18294399976730347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,16,power_law_1.2,0.16607999801635742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,16,power_law_1.2,0.1746240019798279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,2,balanced,1.037717342376709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,2,balanced,1.039199988047282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,2,power_law_1.01,0.794265604019165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,2,power_law_1.01,0.8018239974975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,2,power_law_1.2,0.7771391868591309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,2,power_law_1.2,0.8150015830993652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,256,balanced,0.06221333146095276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,256,balanced,0.062496001521746315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,256,power_law_1.01,0.06151679754257202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,256,power_law_1.01,0.06170880198478699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,256,power_law_1.2,0.060812801122665405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,256,power_law_1.2,0.06638079881668091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,32,balanced,0.13010666767756143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,32,balanced,0.1304639975229899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,32,power_law_1.01,0.11618560552597046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,32,power_law_1.01,0.12057600021362305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,32,power_law_1.2,0.12235519886016846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,32,power_law_1.2,0.12265599966049194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,4,balanced,0.5609493255615234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,4,balanced,0.74944535891215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,4,power_law_1.01,0.4488192081451416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,4,power_law_1.01,0.45827198028564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,4,power_law_1.2,0.42466559410095217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,4,power_law_1.2,0.48214402198791506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,64,balanced,0.09885332981745402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,64,balanced,0.09896000226338704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,64,power_law_1.01,0.09293439984321594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,64,power_law_1.01,0.09711359739303589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,64,power_law_1.2,0.09184640049934387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,64,power_law_1.2,0.09628159999847412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,8,balanced,0.3113226691881816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,8,balanced,0.32174400488535565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,8,power_law_1.01,0.26645760536193847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,8,power_law_1.01,0.2730815887451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,8,power_law_1.2,0.2482304096221924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,1,8,power_law_1.2,0.2803647994995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,16,1,balanced,0.24764267603556314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,16,1,balanced,0.25031999746958417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,16,1,power_law_1.01,0.18523520231246948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,16,1,power_law_1.01,0.18635519742965698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,16,1,power_law_1.2,0.18484480381011964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,16,1,power_law_1.2,0.1859455943107605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,2,1,balanced,1.0645919640858967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,2,1,balanced,1.0742666721343994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,2,1,power_law_1.01,0.7711872100830078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,2,1,power_law_1.01,0.7771008014678955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,2,1,power_law_1.2,0.7545023918151855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,2,1,power_law_1.2,0.7596864223480224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,32,1,balanced,0.19534399112065634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,32,1,balanced,0.19645333290100098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,32,1,power_law_1.01,0.15675519704818724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,32,1,power_law_1.01,0.15779839754104613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,32,1,power_law_1.2,0.1535040020942688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,32,1,power_law_1.2,0.15421439409255983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,4,1,balanced,0.5901866753896078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,4,1,balanced,0.5933813254038492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,4,1,power_law_1.01,0.44399361610412597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,4,1,power_law_1.01,0.44593281745910646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,4,1,power_law_1.2,0.43205761909484863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,4,1,power_law_1.2,0.43561601638793945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,8,1,balanced,0.36265599727630615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,8,1,balanced,0.3678453365961711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,8,1,power_law_1.01,0.2700671911239624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,8,1,power_law_1.01,0.2743680000305176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,8,1,power_law_1.2,0.26485118865966795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,256,8,1,power_law_1.2,0.2652031898498535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,1,balanced,3.126842816670736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,1,balanced,3.1684160232543945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,1,power_law_1.01,1.51910400390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,1,power_law_1.01,1.5286656379699708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,1,power_law_1.2,1.394803237915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,1,power_law_1.2,1.4404800415039063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,128,balanced,0.09620799620946248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,128,balanced,0.09724799791971843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,128,power_law_1.01,0.09228159785270691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,128,power_law_1.01,0.09348480105400085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,128,power_law_1.2,0.09241600036621093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,128,power_law_1.2,0.09248639941215515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,16,balanced,0.252400000890096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,16,balanced,0.25417067607243854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,16,power_law_1.01,0.1893183946609497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,16,power_law_1.01,0.24204800128936768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,16,power_law_1.2,0.19482879638671874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,16,power_law_1.2,0.21593599319458007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,2,balanced,1.5303893089294434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,2,balanced,1.5309707323710124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,2,power_law_1.01,0.8228672027587891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,2,power_law_1.01,0.8848896026611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,2,power_law_1.2,0.7933184146881104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,2,power_law_1.2,0.8620927810668946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,32,balanced,0.1620319982369741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,32,balanced,0.1623093287150065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,32,power_law_1.01,0.13325439691543578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,32,power_law_1.01,0.14287359714508058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,32,power_law_1.2,0.1380288004875183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,32,power_law_1.2,0.14328320026397706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,4,balanced,0.7999893029530843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,4,balanced,0.8010453383127848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,4,power_law_1.01,0.4847616195678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,4,power_law_1.01,0.5826687812805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,4,power_law_1.2,0.5520832061767578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,4,power_law_1.2,0.5558271884918213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,64,balanced,0.12032000223795573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,64,balanced,0.12237866719563802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,64,power_law_1.01,0.10714240074157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,64,power_law_1.01,0.10847359895706177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,64,power_law_1.2,0.10432000160217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,64,power_law_1.2,0.10633599758148193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,8,balanced,0.434224009513855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,8,balanced,0.43775467077891034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,8,power_law_1.01,0.30678400993347166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,8,power_law_1.01,0.3916287899017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,8,power_law_1.2,0.40601601600646975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,1,8,power_law_1.2,0.42539520263671876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,16,1,balanced,0.3333706855773926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,16,1,balanced,0.33371198177337646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,16,1,power_law_1.01,0.194649600982666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,16,1,power_law_1.01,0.19853440523147584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,16,1,power_law_1.2,0.18989440202713012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,16,1,power_law_1.2,0.19070719480514525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,2,1,balanced,1.5724746386210124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,2,1,balanced,1.5741119384765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,2,1,power_law_1.01,0.8233471870422363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,2,1,power_law_1.01,0.8247167587280273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,2,1,power_law_1.2,0.7412543773651123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,2,1,power_law_1.2,0.7470016002655029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,32,1,balanced,0.2733280062675476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,32,1,balanced,0.27348800500233966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,32,1,power_law_1.01,0.17095040082931517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,32,1,power_law_1.01,0.1748095989227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,32,1,power_law_1.2,0.16005120277404786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,32,1,power_law_1.2,0.16051199436187744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,4,1,balanced,0.86244797706604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,4,1,balanced,0.8632853031158447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,4,1,power_law_1.01,0.45967998504638674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,4,1,power_law_1.01,0.4683328151702881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,4,1,power_law_1.2,0.43218560218811036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,4,1,power_law_1.2,0.4364160060882568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,8,1,balanced,0.5085920095443726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,8,1,balanced,0.5097440083821615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,8,1,power_law_1.01,0.2857088088989258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,8,1,power_law_1.01,0.29005439281463624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,8,1,power_law_1.2,0.2668287992477417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,48,7168,2048,8,384,8,1,power_law_1.2,0.2706496000289917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,1,balanced,0.16293332974116007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,1,balanced,0.16310933232307434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,1,power_law_1.01,0.17142399549484252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,1,power_law_1.01,0.17164160013198854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,1,power_law_1.2,0.17181440591812133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,1,power_law_1.2,0.17240959405899048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,128,balanced,0.06840533514817555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,128,balanced,0.06844800213972728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,128,power_law_1.01,0.06787840127944947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,128,power_law_1.01,0.06993920207023621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,128,power_law_1.2,0.06837120056152343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,128,power_law_1.2,0.06928640007972717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,16,balanced,0.07201600074768066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,16,balanced,0.07215466598669688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,16,power_law_1.01,0.07325440049171447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,16,power_law_1.01,0.07456640005111695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,16,power_law_1.2,0.0720255970954895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,16,power_law_1.2,0.07338240146636962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,2,balanced,0.11987732847531636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,2,balanced,0.11989866693814595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,2,power_law_1.01,0.12563199996948243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,2,power_law_1.01,0.12624000310897826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,2,power_law_1.2,0.1277184009552002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,2,power_law_1.2,0.12818559408187866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,32,balanced,0.0683840016523997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,32,balanced,0.06966933111349742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,32,power_law_1.01,0.06881279945373535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,32,power_law_1.01,0.06906880140304565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,32,power_law_1.2,0.06972159743309021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,32,power_law_1.2,0.06974080204963684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,4,balanced,0.09707732995351155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,4,balanced,0.09935999910036723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,4,power_law_1.01,0.09978240132331848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,4,power_law_1.01,0.10021120309829712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,4,power_law_1.2,0.10021760463714599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,4,power_law_1.2,0.10055680274963379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,64,balanced,0.068271999557813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,64,balanced,0.06838933130105336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,64,power_law_1.01,0.06867200136184692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,64,power_law_1.01,0.06872320175170898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,64,power_law_1.2,0.06917759776115417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,64,power_law_1.2,0.06936320066452026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,8,balanced,0.07846400141716003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,8,balanced,0.07875200112660725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,8,power_law_1.01,0.08230400085449219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,8,power_law_1.01,0.08298239707946778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,8,power_law_1.2,0.08437119722366333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,1,8,power_law_1.2,0.08460800051689148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,2,1,balanced,0.10934399565060933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,2,1,balanced,0.11142399907112122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,2,1,power_law_1.01,0.11739519834518433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,2,1,power_law_1.01,0.11745920181274414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,2,1,power_law_1.2,0.1191167950630188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,2,1,power_law_1.2,0.11946239471435546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,4,1,balanced,0.08855467041333516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,4,1,balanced,0.08950933814048767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,4,1,power_law_1.01,0.09669119715690613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,4,1,power_law_1.01,0.09710080027580262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,4,1,power_law_1.2,0.09675520062446594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2048,768,8,128,4,1,power_law_1.2,0.0971455991268158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,1,balanced,0.37939735253651935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,1,balanced,0.37985066572825116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,1,power_law_1.01,0.3752000093460083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,1,power_law_1.01,0.3758080005645752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,1,power_law_1.2,0.38226559162139895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,1,power_law_1.2,0.38353919982910156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,128,balanced,0.09090666969617207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,128,balanced,0.0927946666876475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,128,power_law_1.01,0.09204480051994324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,128,power_law_1.01,0.09304959774017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,128,power_law_1.2,0.0926144003868103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,128,power_law_1.2,0.09281280040740966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,16,balanced,0.10518399874369304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,16,balanced,0.10524266958236694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,16,power_law_1.01,0.1071679949760437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,16,power_law_1.01,0.11176960468292237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,16,power_law_1.2,0.11075199842453003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,16,power_law_1.2,0.11172480583190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,2,balanced,0.24866666396458945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,2,balanced,0.24911999702453613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,2,power_law_1.01,0.2408384084701538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,2,power_law_1.01,0.24260480403900148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,2,power_law_1.2,0.2416383981704712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,2,power_law_1.2,0.24955520629882813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,32,balanced,0.09673600395520528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,32,balanced,0.0969599982102712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,32,power_law_1.01,0.09832320213317872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,32,power_law_1.01,0.09937279820442199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,32,power_law_1.2,0.10059520006179809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,32,power_law_1.2,0.10179840326309204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,4,balanced,0.17384533087412515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,4,balanced,0.1754080057144165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,4,power_law_1.01,0.16777600049972535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,4,power_law_1.01,0.17433600425720214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,4,power_law_1.2,0.17329280376434325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,4,power_law_1.2,0.17333120107650757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,64,balanced,0.09297066926956177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,64,balanced,0.09458133578300476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,64,power_law_1.01,0.09251840114593506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,64,power_law_1.01,0.09736319780349731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,64,power_law_1.2,0.09537919759750366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,64,power_law_1.2,0.09559680223464966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,8,balanced,0.1339040001233419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,8,balanced,0.13446399569511414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,8,power_law_1.01,0.13548799753189086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,8,power_law_1.01,0.1364416003227234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,8,power_law_1.2,0.13276159763336182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,1,8,power_law_1.2,0.13445119857788085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,16,1,balanced,0.3380426565806071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,16,1,balanced,0.33874134222666424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,16,1,power_law_1.01,0.3577536106109619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,16,1,power_law_1.01,0.36937599182128905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,16,1,power_law_1.2,0.36764159202575686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,16,1,power_law_1.2,0.3758464097976685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,2,1,balanced,0.22952000300089517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,2,1,balanced,0.2295466661453247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,2,1,power_law_1.01,0.22440319061279296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,2,1,power_law_1.01,0.22488319873809814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,2,1,power_law_1.2,0.2306432008743286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,2,1,power_law_1.2,0.23274879455566405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,32,1,balanced,0.308896005153656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,32,1,balanced,0.31006399790445965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,32,1,power_law_1.01,0.3288127899169922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,32,1,power_law_1.01,0.33432960510253906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,32,1,power_law_1.2,0.3403520107269287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,32,1,power_law_1.2,0.341644811630249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,4,1,balanced,0.15229866902033487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,4,1,balanced,0.1525813341140747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,4,1,power_law_1.01,0.14922239780426025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,4,1,power_law_1.01,0.15002880096435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,4,1,power_law_1.2,0.15356160402297975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,4,1,power_law_1.2,0.15368959903717042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,8,1,balanced,0.43830398718516034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,8,1,balanced,0.438752015431722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,8,1,power_law_1.01,0.4614975929260254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,8,1,power_law_1.01,0.46183037757873535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,8,1,power_law_1.2,0.47927041053771974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,2688,1856,6,128,8,1,power_law_1.2,0.491315221786499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,1,balanced,0.6330613295237223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,1,balanced,0.6353493531545004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,1,power_law_1.01,0.5889664173126221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,1,power_law_1.01,0.5904319763183594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,1,power_law_1.2,0.6047999858856201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,1,power_law_1.2,0.6099584102630615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,128,balanced,0.13019733627637228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,128,balanced,0.13168000181516012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,128,power_law_1.01,0.12997759580612184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,128,power_law_1.01,0.13006720542907715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,128,power_law_1.2,0.13073920011520385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,128,power_law_1.2,0.13127679824829103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,16,balanced,0.16481066743532816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,16,balanced,0.16569067041079202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,16,power_law_1.01,0.16658560037612916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,16,power_law_1.01,0.16864639520645142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,16,power_law_1.2,0.16830719709396363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,16,power_law_1.2,0.1709887981414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,2,balanced,0.39582931995391846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,2,balanced,0.3970613479614258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,2,power_law_1.01,0.376857590675354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,2,power_law_1.01,0.37706880569458007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,2,power_law_1.2,0.3725055932998657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,2,power_law_1.2,0.37457919120788574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,256,balanced,0.12786666552225748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,256,balanced,0.12981333335240683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,256,power_law_1.01,0.1297152042388916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,256,power_law_1.01,0.13022719621658324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,256,power_law_1.2,0.12785919904708862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,256,power_law_1.2,0.12980480194091798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,32,balanced,0.14038933316866556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,32,balanced,0.14103999733924866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,32,power_law_1.01,0.13938560485839843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,32,power_law_1.01,0.14137599468231202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,32,power_law_1.2,0.14227839708328247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,32,power_law_1.2,0.1446463942527771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,4,balanced,0.26743467648824054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,4,balanced,0.26934399207433063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,4,power_law_1.01,0.2564863920211792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,4,power_law_1.01,0.25999999046325684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,4,power_law_1.2,0.262060809135437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,4,power_law_1.2,0.26620800495147706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,64,balanced,0.13395200173060098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,64,balanced,0.13435199856758118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,64,power_law_1.01,0.13397760391235353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,64,power_law_1.01,0.1342144012451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,64,power_law_1.2,0.13414399623870848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,64,power_law_1.2,0.1354688048362732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,8,balanced,0.19894399245580038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,8,balanced,0.1994453271230062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,8,power_law_1.01,0.19610879421234131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,8,power_law_1.01,0.20188159942626954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,8,power_law_1.2,0.20072319507598876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,1,8,power_law_1.2,0.20076799392700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,16,1,balanced,0.15152000387509665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,16,1,balanced,0.15194666385650635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,16,1,power_law_1.01,0.14695039987564087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,16,1,power_law_1.01,0.1474560022354126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,16,1,power_law_1.2,0.14942079782485962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,2,1,balanced,0.3654346863428752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,2,1,balanced,0.3655466636021932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,2,1,power_law_1.01,0.3428096055984497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,2,1,power_law_1.01,0.34408960342407224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,2,1,power_law_1.2,0.35050880908966064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,2,1,power_law_1.2,0.3529792070388794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,32,1,balanced,0.13007466991742453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,32,1,balanced,0.13128532965977988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,32,1,power_law_1.01,0.12700159549713136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,32,1,power_law_1.01,0.12773120403289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,32,1,power_law_1.2,0.12940800189971924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,32,1,power_law_1.2,0.12979840040206908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,4,1,balanced,0.23639466365178427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,4,1,balanced,0.23640000820159912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,4,1,power_law_1.01,0.22346880435943603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,4,1,power_law_1.01,0.22691199779510499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,4,1,power_law_1.2,0.23054718971252441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,4,1,power_law_1.2,0.23070080280303956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,8,1,balanced,0.17421332995096842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,8,1,balanced,0.17470399538675943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,8,1,power_law_1.01,0.16821119785308838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,8,1,power_law_1.01,0.16984319686889648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,8,1,power_law_1.2,0.1710592031478882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,3072,1536,8,256,8,1,power_law_1.2,0.17159680128097535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,1,balanced,0.4322880109151204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,1,balanced,0.43380268414815265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,1,power_law_1.01,0.5196352005004883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,1,power_law_1.01,0.5197184085845947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,1,power_law_1.2,0.5176000118255615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,1,power_law_1.2,0.5262847900390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,2,balanced,0.26879467566808063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,2,balanced,0.27191466093063354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,2,power_law_1.01,0.32969601154327394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,2,power_law_1.01,0.3539711952209473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,2,power_law_1.2,0.3559103965759277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,2,power_law_1.2,0.38000640869140623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,4,balanced,0.2076639930407206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,4,balanced,0.20780267318089804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,4,power_law_1.01,0.24808320999145508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,4,power_law_1.01,0.2506432056427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,4,power_law_1.2,0.24638080596923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,4,power_law_1.2,0.25052800178527834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,8,balanced,0.18172266085942587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,8,balanced,0.18198400735855103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,8,power_law_1.01,0.21721599102020264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,8,power_law_1.01,0.22656641006469727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,8,power_law_1.2,0.22403199672698976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,1,8,power_law_1.2,0.22554240226745606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,16,1,balanced,0.06628799935181935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,16,1,balanced,0.06689600149790446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,16,1,power_law_1.01,0.06662399768829345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,16,1,power_law_1.01,0.0670527994632721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,16,1,power_law_1.2,0.06689280271530151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,16,1,power_law_1.2,0.06778879761695862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,2,1,balanced,0.23672000567118326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,2,1,balanced,0.2381653388341268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,2,1,power_law_1.01,0.2591808080673218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,2,1,power_law_1.01,0.26141440868377686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,2,1,power_law_1.2,0.2658560037612915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,2,1,power_law_1.2,0.2678976058959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,32,1,balanced,0.05045333504676819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,32,1,balanced,0.05402133365472158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,32,1,power_law_1.01,0.052185600996017455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,32,1,power_law_1.01,0.05377920269966126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,32,1,power_law_1.2,0.05244799852371216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,32,1,power_law_1.2,0.052742397785186766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,4,1,balanced,0.14086400469144186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,4,1,balanced,0.14281599720319113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,4,1,power_law_1.01,0.145907199382782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,4,1,power_law_1.01,0.14759039878845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,4,1,power_law_1.2,0.1468287944793701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,4,1,power_law_1.2,0.14835200309753419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,8,1,balanced,0.0939466655254364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,8,1,balanced,0.09597866733868916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,8,1,power_law_1.01,0.09567360281944275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,8,1,power_law_1.01,0.09745919704437256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,8,1,power_law_1.2,0.0974399983882904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,14336,2,8,8,1,power_law_1.2,0.09882240295410157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,1,balanced,0.4567573467890422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,1,balanced,0.4609973430633545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,1,power_law_1.01,0.4725759983062744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,1,power_law_1.01,0.4738431930541992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,1,power_law_1.2,0.48037118911743165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,1,power_law_1.2,0.488972806930542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,128,balanced,0.11272000273068745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,128,balanced,0.11289599537849426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,128,power_law_1.01,0.11311999559402466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,128,power_law_1.01,0.11402239799499511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,128,power_law_1.2,0.11437439918518066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,128,power_law_1.2,0.11538560390472412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,16,balanced,0.12549866239229837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,16,balanced,0.12557866175969443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,16,power_law_1.01,0.1356160044670105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,16,power_law_1.01,0.13729920387268066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,16,power_law_1.2,0.14165760278701783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,16,power_law_1.2,0.14357119798660278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,2,balanced,0.29480000336964923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,2,balanced,0.2974933385848999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,2,power_law_1.01,0.3053567886352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,2,power_law_1.01,0.30753920078277586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,2,power_law_1.2,0.3078464031219482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,2,power_law_1.2,0.3095936059951782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,32,balanced,0.11688533425331116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,32,balanced,0.11753599842389424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,32,power_law_1.01,0.12001279592514039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,32,power_law_1.01,0.1224128007888794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,32,power_law_1.2,0.12401280403137208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,32,power_law_1.2,0.12579200267791749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,4,balanced,0.2039946715037028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,4,balanced,0.20530666907628378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,4,power_law_1.01,0.21529600620269776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,4,power_law_1.01,0.2165247917175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,4,power_law_1.2,0.21333119869232178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,4,power_law_1.2,0.21422080993652343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,64,balanced,0.11424533526102702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,64,balanced,0.11590933799743652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,64,power_law_1.01,0.11787519454956055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,64,power_law_1.01,0.11824640035629272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,64,power_law_1.2,0.12002559900283813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,64,power_law_1.2,0.12098560333251954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,8,balanced,0.16049599647521973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,8,balanced,0.16084800163904825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,8,power_law_1.01,0.16254719495773315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,8,power_law_1.01,0.16824959516525267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,8,power_law_1.2,0.168614399433136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,1,8,power_law_1.2,0.17188479900360107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,16,1,balanced,0.12114666899045308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,16,1,balanced,0.12392533818880717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,16,1,power_law_1.01,0.1277119994163513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,16,1,power_law_1.01,0.12814719676971437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,16,1,power_law_1.2,0.12811520099639892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,16,1,power_law_1.2,0.12830079793930055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,2,1,balanced,0.2737119992574056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,2,1,balanced,0.2744479974110921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,2,1,power_law_1.01,0.2853440046310425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,2,1,power_law_1.01,0.2876032114028931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,2,1,power_law_1.2,0.28891520500183104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,2,1,power_law_1.2,0.2897471904754639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,32,1,balanced,0.11313600341478984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,32,1,balanced,0.1146399974822998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,32,1,power_law_1.01,0.11851520538330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,32,1,power_law_1.01,0.11907839775085449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,32,1,power_law_1.2,0.11943039894104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,32,1,power_law_1.2,0.1195520043373108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,4,1,balanced,0.18321067094802856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,4,1,balanced,0.18339200814565024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,4,1,power_law_1.01,0.19435520172119142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,4,1,power_law_1.01,0.19436800479888916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,4,1,power_law_1.2,0.19722239971160888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,4,1,power_law_1.2,0.19735039472579957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,8,1,balanced,0.14197867115338644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,8,1,balanced,0.14350933829943338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,8,1,power_law_1.01,0.1566655993461609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,8,1,power_law_1.01,0.156985604763031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,8,1,power_law_1.2,0.15809279680252075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,1536,8,128,8,1,power_law_1.2,0.15930240154266356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,1,balanced,2.9203093846639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,1,balanced,2.937941233317057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,1,power_law_1.01,2.7375808715820313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,1,power_law_1.01,2.8328447341918945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,1,power_law_1.2,2.8795520782470705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,1,power_law_1.2,2.93057918548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,128,balanced,0.4202186663945516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,128,balanced,0.4205973148345947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,128,power_law_1.01,0.4257535934448242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,128,power_law_1.01,0.42778878211975097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,128,power_law_1.2,0.4331711769104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,128,power_law_1.2,0.4347775936126709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,16,balanced,0.577450672785441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,16,balanced,0.5801599820454916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,16,power_law_1.01,0.5674623966217041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,16,power_law_1.01,0.5733888149261475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,16,power_law_1.2,0.5838784217834473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,16,power_law_1.2,0.5842559814453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,2,balanced,1.6375840504964192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,2,balanced,1.674191951751709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,2,power_law_1.01,1.601055908203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,2,power_law_1.01,1.6087743759155273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,2,power_law_1.2,1.6505151748657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,2,power_law_1.2,1.6608383178710937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,256,balanced,0.41836798191070557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,256,balanced,0.4199093182881673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,256,power_law_1.01,0.4215551853179932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,256,power_law_1.01,0.42203521728515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,256,power_law_1.2,0.4218111991882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,256,power_law_1.2,0.42446079254150393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,32,balanced,0.487770676612854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,32,balanced,0.4901546637217204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,32,power_law_1.01,0.48974080085754396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,32,power_law_1.01,0.49028477668762205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,32,power_law_1.2,0.4929920196533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,32,power_law_1.2,0.5027584075927735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,4,balanced,1.0337440172831218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,4,balanced,1.0374186833699544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,4,power_law_1.01,1.0028223991394043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,4,power_law_1.01,1.0248831748962401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,4,power_law_1.2,1.034118366241455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,4,power_law_1.2,1.0457280158996582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,64,balanced,0.43826134999593097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,64,balanced,0.4391680161158244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,64,power_law_1.01,0.4525184154510498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,64,power_law_1.01,0.4534592151641846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,64,power_law_1.2,0.45840001106262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,64,power_law_1.2,0.45929598808288574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,8,balanced,0.7303199768066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,8,balanced,0.7331573168436686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,8,power_law_1.01,0.715123176574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,8,power_law_1.01,0.7296000003814698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,8,power_law_1.2,0.727948808670044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,1,8,power_law_1.2,0.7380352020263672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,16,1,balanced,2.351967970530192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,16,1,balanced,2.3532533645629883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,16,1,power_law_1.01,2.4307647705078126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,16,1,power_law_1.01,2.4332607269287108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,16,1,power_law_1.2,2.5835712432861326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,16,1,power_law_1.2,2.5962240219116213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,2,1,balanced,1.5166080792744954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,2,1,balanced,1.5482667287190754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,2,1,power_law_1.01,1.458176040649414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,2,1,power_law_1.01,1.4878016471862794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,2,1,power_law_1.2,1.5030783653259276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,2,1,power_law_1.2,1.5264320373535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,32,1,balanced,1.8330453236897786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,32,1,balanced,1.8331093788146973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,32,1,power_law_1.01,1.8963071823120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,32,1,power_law_1.01,1.918707275390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,32,1,power_law_1.2,2.0158336639404295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,32,1,power_law_1.2,2.0312576293945312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,4,1,balanced,0.8666026592254639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,4,1,balanced,0.8674879868825277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,4,1,power_law_1.01,0.8599616050720215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,4,1,power_law_1.01,0.8608063697814942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,4,1,power_law_1.2,0.8791680335998535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,4,1,power_law_1.2,0.8839615821838379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,8,1,balanced,0.556170662244161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,8,1,balanced,0.5566826661427816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,8,1,power_law_1.01,0.5594175815582275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,8,1,power_law_1.01,0.5664768218994141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,8,1,power_law_1.2,0.5700736045837402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,4096,2688,22,512,8,1,power_law_1.2,0.5749375820159912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,1,balanced,0.7026986281077067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,1,balanced,0.7089227040608724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,1,power_law_1.01,0.8793472290039063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,1,power_law_1.01,0.8808064460754395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,1,power_law_1.2,0.8294079780578614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,1,power_law_1.2,0.8379520416259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,2,balanced,0.4057493209838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,2,balanced,0.4071466525395711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,2,power_law_1.01,0.5569983959197998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,2,power_law_1.01,0.5645055770874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,2,power_law_1.2,0.574502420425415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,2,power_law_1.2,0.6281792163848877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,4,balanced,0.26817599932352704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,4,balanced,0.2683359980583191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,4,power_law_1.01,0.35111041069030763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,4,power_law_1.01,0.35704960823059084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,4,power_law_1.2,0.3445120096206665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,4,power_law_1.2,0.36329600811004636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,8,balanced,0.225765327612559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,8,balanced,0.2290453314781189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,8,power_law_1.01,0.2877311944961548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,8,power_law_1.01,0.28784000873565674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,8,power_law_1.2,0.27269759178161623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,1,8,power_law_1.2,0.2990272045135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,16,1,balanced,0.08684800068537395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,16,1,balanced,0.08871466914812724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,16,1,power_law_1.01,0.09288960099220275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,16,1,power_law_1.01,0.093094402551651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,16,1,power_law_1.2,0.08993279933929443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,16,1,power_law_1.2,0.09131519794464112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,2,1,balanced,0.34599467118581134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,2,1,balanced,0.34862399101257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,2,1,power_law_1.01,0.42101759910583497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,2,1,power_law_1.01,0.4252352237701416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,2,1,power_law_1.2,0.41377921104431153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,2,1,power_law_1.2,0.42624640464782715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,32,1,balanced,0.07436266541481018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,32,1,balanced,0.07448000212510426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,32,1,power_law_1.01,0.07735679745674133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,32,1,power_law_1.01,0.07794560194015503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,32,1,power_law_1.2,0.07681279778480529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,32,1,power_law_1.2,0.07710719704627991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,4,1,balanced,0.19862399498621622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,4,1,balanced,0.20127467314402261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,4,1,power_law_1.01,0.230515193939209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,4,1,power_law_1.01,0.23169920444488526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,4,1,power_law_1.2,0.22617599964141846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,4,1,power_law_1.2,0.2271359920501709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,8,1,balanced,0.13052800297737122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,8,1,balanced,0.13194132844607034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,8,1,power_law_1.01,0.1352512001991272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,8,1,power_law_1.01,0.13879040479660035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,8,1,power_law_1.2,0.13651200532913207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,16384,2,8,8,1,power_law_1.2,0.13852159976959227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,1,balanced,1.6374986966451008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,1,balanced,1.643162727355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,1,power_law_1.01,1.4610048294067384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,1,power_law_1.01,1.4729344367980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,1,power_law_1.2,1.5079615592956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,1,power_law_1.2,1.56243839263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,128,balanced,0.20680000384648642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,128,balanced,0.20742400487263998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,128,power_law_1.01,0.20776960849761963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,128,power_law_1.01,0.2087615966796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,128,power_law_1.2,0.2092992067337036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,128,power_law_1.2,0.21020159721374512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,16,balanced,0.2964319984118144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,16,balanced,0.2964959939320882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,16,power_law_1.01,0.2879807949066162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,16,power_law_1.01,0.2903872013092041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,16,power_law_1.2,0.29231359958648684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,16,power_law_1.2,0.29534718990325926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,2,balanced,0.9145066738128662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,2,balanced,0.9195466836293539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,2,power_law_1.01,0.8422080039978027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,2,power_law_1.01,0.8502592086791992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,2,power_law_1.2,0.8581119537353515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,2,power_law_1.2,0.881100845336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,256,balanced,0.2034613291422526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,256,balanced,0.2035199999809265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,256,power_law_1.01,0.20353279113769532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,256,power_law_1.01,0.2035968065261841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,256,power_law_1.2,0.2050879955291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,256,power_law_1.2,0.20570240020751954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,32,balanced,0.23539199431737265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,32,balanced,0.2363413373629252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,32,power_law_1.01,0.2391040086746216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,32,power_law_1.01,0.2397183895111084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,32,power_law_1.2,0.24571518898010253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,32,power_law_1.2,0.2463360071182251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,4,balanced,0.559002677599589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,4,balanced,0.5596640110015869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,4,power_law_1.01,0.5376192092895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,4,power_law_1.01,0.5454336166381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,4,power_law_1.2,0.5475711822509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,4,power_law_1.2,0.550713586807251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,64,balanced,0.209498663743337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,64,balanced,0.21182399988174438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,64,power_law_1.01,0.21334400177001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,64,power_law_1.01,0.2134399890899658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,64,power_law_1.2,0.2161344051361084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,64,power_law_1.2,0.21943039894104005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,8,balanced,0.385103980700175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,8,balanced,0.3876533508300781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,8,power_law_1.01,0.3698944091796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,8,power_law_1.01,0.37128961086273193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,8,power_law_1.2,0.37090559005737306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,1,8,power_law_1.2,0.38078720569610597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,16,1,balanced,0.2725920081138611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,16,1,balanced,0.2732906738917033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,16,1,power_law_1.01,0.2649343967437744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,16,1,power_law_1.01,0.2660799980163574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,16,1,power_law_1.2,0.27107839584350585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,16,1,power_law_1.2,0.27150719165802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,2,1,balanced,0.8598293463389078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,2,1,balanced,0.8600587050120035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,2,1,power_law_1.01,0.779417610168457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,2,1,power_law_1.01,0.7866816043853759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,2,1,power_law_1.2,0.8113471984863281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,2,1,power_law_1.2,0.8223360061645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,32,1,balanced,0.23040533065795898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,32,1,balanced,0.23269333442052206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,32,1,power_law_1.01,0.225382399559021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,32,1,power_law_1.01,0.22597761154174806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,32,1,power_law_1.2,0.22850561141967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,32,1,power_law_1.2,0.22877440452575684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,4,1,balanced,0.5007946491241455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,4,1,balanced,0.5017120043436686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,4,1,power_law_1.01,0.4778751850128174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,4,1,power_law_1.01,0.4815680027008057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,4,1,power_law_1.2,0.4788671970367432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,4,1,power_law_1.2,0.48670082092285155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,8,1,balanced,0.34413333733876544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,8,1,balanced,0.3449546496073405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,8,1,power_law_1.01,0.3308480024337769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,8,1,power_law_1.01,0.3330048084259033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,8,1,power_law_1.2,0.3378495931625366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2048,8,256,8,1,power_law_1.2,0.3391871929168701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,1,balanced,1.2927040259043376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,1,balanced,1.305466651916504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,1,power_law_1.01,1.2623104095458983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,1,power_law_1.01,1.2849023818969727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,1,power_law_1.2,1.325062370300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,1,power_law_1.2,1.3252927780151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,16,balanced,0.25094934304555255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,16,balanced,0.2509866754213969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,16,power_law_1.01,0.25292799472808836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,16,power_law_1.01,0.25502719879150393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,16,power_law_1.2,0.2560447931289673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,16,power_law_1.2,0.2597055912017822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,2,balanced,0.7336266835530599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,2,balanced,0.7336853345235189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,2,power_law_1.01,0.7240575790405274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,2,power_law_1.01,0.7542463779449463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,2,power_law_1.2,0.7467008113861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,2,power_law_1.2,0.7690815925598145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,32,balanced,0.19535466035207114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,32,balanced,0.1957333286603292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,32,power_law_1.01,0.21190400123596193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,32,power_law_1.01,0.2149440050125122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,32,power_law_1.2,0.21804161071777345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,32,power_law_1.2,0.22865281105041504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,4,balanced,0.45812801520029706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,4,balanced,0.4591519832611084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,4,power_law_1.01,0.4705344200134277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,4,power_law_1.01,0.47178239822387696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,4,power_law_1.2,0.46662402153015137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,4,power_law_1.2,0.47907199859619143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,8,balanced,0.3195040027300517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,8,balanced,0.31986133257548016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,8,power_law_1.01,0.32753920555114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,8,power_law_1.01,0.3281536102294922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,8,power_law_1.2,0.3308608055114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,1,8,power_law_1.2,0.3314496040344238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,16,1,balanced,0.2291733423868815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,16,1,balanced,0.22924266258875528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,16,1,power_law_1.01,0.23123838901519775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,16,1,power_law_1.01,0.23223040103912354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,16,1,power_law_1.2,0.2347264051437378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,16,1,power_law_1.2,0.23505280017852784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,2,1,balanced,0.6973013083140055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,2,1,balanced,0.6981386343638102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,2,1,power_law_1.01,0.6969727993011474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,2,1,power_law_1.01,0.7054207801818848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,2,1,power_law_1.2,0.7115263938903809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,2,1,power_law_1.2,0.7143424034118653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,32,1,balanced,0.18372799952824911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,32,1,balanced,0.1850186586380005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,32,1,power_law_1.01,0.18946559429168702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,32,1,power_law_1.01,0.18977279663085939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,32,1,power_law_1.2,0.19111039638519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,32,1,power_law_1.2,0.1912832021713257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,4,1,balanced,0.4050026734670003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,4,1,balanced,0.40697065989176434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,4,1,power_law_1.01,0.4121535778045654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,4,1,power_law_1.01,0.4189568042755127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,4,1,power_law_1.2,0.42705278396606444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,4,1,power_law_1.2,0.42821760177612306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,8,1,balanced,0.269375999768575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,8,1,balanced,0.26942400137583417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,8,1,power_law_1.01,0.2869632005691528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,8,1,power_law_1.01,0.28898561000823975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,8,1,power_law_1.2,0.2916352033615112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,6144,2560,8,160,8,1,power_law_1.2,0.2932096004486084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,1,balanced,1.8927466074625652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,1,balanced,1.8999999364217122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,1,power_law_1.01,1.707846450805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,1,power_law_1.01,1.7397184371948242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,1,power_law_1.2,1.7669055938720704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,1,power_law_1.2,1.7867328643798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,128,balanced,0.22566932439804077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,128,balanced,0.2272640069325765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,128,power_law_1.01,0.2273535966873169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,128,power_law_1.01,0.2288383960723877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,128,power_law_1.2,0.22977280616760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,128,power_law_1.2,0.2311039924621582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,16,balanced,0.33581332365671795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,16,balanced,0.3361813227335612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,16,power_law_1.01,0.3186624050140381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,16,power_law_1.01,0.3231040000915527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,16,power_law_1.2,0.3213248014450073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,16,power_law_1.2,0.32391040325164794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,2,balanced,1.0490346749623616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,2,balanced,1.0515519777933757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,2,power_law_1.01,0.9833215713500977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,2,power_law_1.01,0.994655990600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,2,power_law_1.2,1.002131175994873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,2,power_law_1.2,1.0029376029968262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,256,balanced,0.222543994585673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,256,balanced,0.22410666942596436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,256,power_law_1.01,0.222489595413208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,256,power_law_1.01,0.22259199619293213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,256,power_law_1.2,0.22490239143371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,256,power_law_1.2,0.22500479221343994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,32,balanced,0.26316267251968384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,32,balanced,0.2645919919013977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,32,power_law_1.01,0.2605567932128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,32,power_law_1.01,0.26917119026184083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,32,power_law_1.2,0.2715008020401001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,32,power_law_1.2,0.2742975950241089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,4,balanced,0.6353813409805298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,4,balanced,0.6364426612854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,4,power_law_1.01,0.5990592002868652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,4,power_law_1.01,0.6101056098937988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,4,power_law_1.2,0.6215360164642334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,4,power_law_1.2,0.6361408233642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,64,balanced,0.23112533489863077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,64,balanced,0.23227733373641968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,64,power_law_1.01,0.23683199882507325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,64,power_law_1.01,0.2385279893875122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,64,power_law_1.2,0.24365439414978027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,64,power_law_1.2,0.24500479698181152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,8,balanced,0.4347626765569051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,8,balanced,0.4371360143025716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,8,power_law_1.01,0.42038397789001464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,8,power_law_1.01,0.4215424060821533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,8,power_law_1.2,0.4181503772735596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,1,8,power_law_1.2,0.42807679176330565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,16,1,balanced,0.3129013379414876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,16,1,balanced,0.31359465916951496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,16,1,power_law_1.01,0.30471680164337156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,16,1,power_law_1.01,0.3050368070602417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,16,1,power_law_1.2,0.30883839130401614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,16,1,power_law_1.2,0.31108479499816893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,2,1,balanced,0.994698683420817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,2,1,balanced,1.0051093101501465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,2,1,power_law_1.01,0.9112192153930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,2,1,power_law_1.01,0.9242367744445801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,2,1,power_law_1.2,0.932044792175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,2,1,power_law_1.2,0.949062442779541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,32,1,balanced,0.26291199525197345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,32,1,balanced,0.26366933186848956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,32,1,power_law_1.01,0.2582655906677246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,32,1,power_law_1.01,0.2592576026916504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,32,1,power_law_1.2,0.25840001106262206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,32,1,power_law_1.2,0.26149759292602537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,4,1,balanced,0.5804959932963053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,4,1,balanced,0.5827146768569946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,4,1,power_law_1.01,0.5472000122070313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,4,1,power_law_1.01,0.5529151916503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,4,1,power_law_1.2,0.5567872047424316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,4,1,power_law_1.2,0.5625408172607422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,8,1,balanced,0.397765318552653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,8,1,balanced,0.3996373414993286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,8,1,power_law_1.01,0.3816767930984497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,8,1,power_law_1.01,0.38368000984191897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,8,1,power_law_1.2,0.38382079601287844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,256,8,1,power_law_1.2,0.38886399269104005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,1,balanced,2.9016478856404624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,1,balanced,2.972655932108561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,1,power_law_1.01,2.3393152236938475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,1,power_law_1.01,2.3557376861572266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,1,power_law_1.2,2.3863040924072267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,1,power_law_1.2,2.402463912963867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,128,balanced,0.28757333755493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,128,balanced,0.2876586715380351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,128,power_law_1.01,0.2846400022506714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,128,power_law_1.01,0.2871040105819702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,128,power_law_1.2,0.28952319622039796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,128,power_law_1.2,0.2905407905578613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,16,balanced,0.43356800079345703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,16,balanced,0.435696005821228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,16,power_law_1.01,0.4151296138763428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,16,power_law_1.01,0.423583984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,16,power_law_1.2,0.4112192153930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,16,power_law_1.2,0.4151103973388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,2,balanced,1.5168372790018718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,2,balanced,1.5356532732645671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,2,power_law_1.01,1.286515235900879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,2,power_law_1.01,1.3323072433471679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,2,power_law_1.2,1.2875519752502442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,2,power_law_1.2,1.3602304458618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,32,balanced,0.34965864817301434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,32,balanced,0.3516000111897786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,32,power_law_1.01,0.333407998085022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,32,power_law_1.01,0.35002880096435546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,32,power_law_1.2,0.3400896072387695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,32,power_law_1.2,0.34787840843200685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,4,balanced,0.8992106914520264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,4,balanced,0.8999626636505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,4,power_law_1.01,0.8041472434997559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,4,power_law_1.01,0.8582783699035644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,4,power_law_1.2,0.8071423530578613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,4,power_law_1.2,0.8562944412231446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,64,balanced,0.3001120090484619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,64,balanced,0.30052800973256427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,64,power_law_1.01,0.297760009765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,64,power_law_1.01,0.30072319507598877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,64,power_law_1.2,0.304915189743042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,64,power_law_1.2,0.30869760513305666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,8,balanced,0.5920106569925944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,8,balanced,0.5926026503245035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,8,power_law_1.01,0.5511104106903076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,8,power_law_1.01,0.5627520084381104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,8,power_law_1.2,0.5554368019104003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,1,8,power_law_1.2,0.5580543994903564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,16,1,balanced,0.4063680171966553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,16,1,balanced,0.40642134348551434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,16,1,power_law_1.01,0.37639679908752444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,16,1,power_law_1.01,0.37651839256286623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,16,1,power_law_1.2,0.37851519584655763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,16,1,power_law_1.2,0.3791359901428223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,2,1,balanced,1.4293546676635742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,2,1,balanced,1.490272045135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,2,1,power_law_1.01,1.2218560218811034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,2,1,power_law_1.01,1.2310336112976075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,2,1,power_law_1.2,1.228927993774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,2,1,power_law_1.2,1.2319168090820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,32,1,balanced,0.3521226644515991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,32,1,balanced,0.35283199946085614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,32,1,power_law_1.01,0.3230720043182373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,32,1,power_law_1.01,0.3249151945114136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,32,1,power_law_1.2,0.33073279857635496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,32,1,power_law_1.2,0.33207039833068847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,4,1,balanced,0.8191359837849935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,4,1,balanced,0.821173350016276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,4,1,power_law_1.01,0.7202367782592773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,4,1,power_law_1.01,0.7235392093658447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,4,1,power_law_1.2,0.7207615852355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,4,1,power_law_1.2,0.7454336166381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,8,1,balanced,0.5454453229904175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,8,1,balanced,0.5471306641896566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,8,1,power_law_1.01,0.4866879940032959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,8,1,power_law_1.01,0.4902207851409912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,8,1,power_law_1.2,0.49572482109069826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,512,7168,2048,8,384,8,1,power_law_1.2,0.5066944122314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,1,balanced,0.6167093515396118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,1,balanced,0.6175626516342163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,1,power_law_1.01,0.6711487770080566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,1,power_law_1.01,0.6803008079528808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,1,power_law_1.2,0.6798655986785889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,1,power_law_1.2,0.6907519817352294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,128,balanced,0.3642666737238566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,128,balanced,0.3654293219248454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,128,power_law_1.01,0.3819648027420044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,128,power_law_1.01,0.3837120056152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,128,power_law_1.2,0.39397759437561036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,128,power_law_1.2,0.3977407932281494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,16,balanced,0.38156267007191974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,16,balanced,0.3819626569747925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,16,power_law_1.01,0.40134401321411134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,16,power_law_1.01,0.4092544078826904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,16,power_law_1.2,0.4121664047241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,16,power_law_1.2,0.4177728176116943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,2,balanced,0.5191520055135092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,2,balanced,0.5215679804484049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,2,power_law_1.01,0.5612415790557861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,2,power_law_1.01,0.5661439895629883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,2,power_law_1.2,0.5665408134460449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,2,power_law_1.2,0.5903103828430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,32,balanced,0.370192011197408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,32,balanced,0.3709919850031535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,32,power_law_1.01,0.39410560131072997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,32,power_law_1.01,0.3948415994644165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,32,power_law_1.2,0.40453758239746096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,32,power_law_1.2,0.4054399967193604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,4,balanced,0.43731733163197833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,4,balanced,0.4416639804840088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,4,power_law_1.01,0.4788991928100586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,4,power_law_1.01,0.4789120197296143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,4,power_law_1.2,0.49258880615234374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,4,power_law_1.2,0.493990421295166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,64,balanced,0.3665013313293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,64,balanced,0.367520014444987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,64,power_law_1.01,0.379366397857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,64,power_law_1.01,0.3871104001998901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,64,power_law_1.2,0.40102400779724123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,64,power_law_1.2,0.4035776138305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,8,balanced,0.40001598993937176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,8,balanced,0.4016000032424927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,8,power_law_1.01,0.4299776077270508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,8,power_law_1.01,0.43227519989013674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,8,power_law_1.2,0.4401535987854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,1,8,power_law_1.2,0.4406015872955322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,2,1,balanced,0.43666664759318036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,2,1,balanced,0.43908798694610596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,2,1,power_law_1.01,0.47788162231445314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,2,1,power_law_1.01,0.48044800758361816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,2,1,power_law_1.2,0.4832128047943115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,2,1,power_law_1.2,0.48336639404296877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,4,1,balanced,0.3660106658935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,4,1,balanced,0.3696213165918986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,4,1,power_law_1.01,0.39907839298248293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,4,1,power_law_1.01,0.4015103816986084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,4,1,power_law_1.2,0.40320639610290526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2048,768,8,128,4,1,power_law_1.2,0.40355839729309084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,1,balanced,1.2048213481903076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,1,balanced,1.228543996810913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,1,power_law_1.01,1.221446418762207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,1,power_law_1.01,1.2314111709594726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,1,power_law_1.2,1.2529024124145507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,1,power_law_1.2,1.2622655868530273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,128,balanced,0.4693439801534017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,128,balanced,0.4713066816329956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,128,power_law_1.01,0.5032256126403809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,128,power_law_1.01,0.5067903995513916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,128,power_law_1.2,0.5370560169219971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,128,power_law_1.2,0.5478335857391358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,16,balanced,0.5174880027770996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,16,balanced,0.5188373327255249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,16,power_law_1.01,0.5577919960021973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,16,power_law_1.01,0.5586495876312256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,16,power_law_1.2,0.5862656116485596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,16,power_law_1.2,0.5922111988067627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,2,balanced,0.8634506861368815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,2,balanced,0.865834633509318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,2,power_law_1.01,0.9102656364440918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,2,power_law_1.01,0.924294376373291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,2,power_law_1.2,0.9096128463745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,2,power_law_1.2,0.9230400085449219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,32,balanced,0.49083733558654785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,32,balanced,0.4917493263880412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,32,power_law_1.01,0.52641282081604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,32,power_law_1.01,0.5277440071105957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,32,power_law_1.2,0.543398380279541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,32,power_law_1.2,0.5538559913635254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,4,balanced,0.6765387058258057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,4,balanced,0.6803946495056152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,4,power_law_1.01,0.7013504028320312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,4,power_law_1.01,0.7285823822021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,4,power_law_1.2,0.7322944164276123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,4,power_law_1.2,0.7324800014495849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,64,balanced,0.4771999915440877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,64,balanced,0.4779680172602336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,64,power_law_1.01,0.5127808094024658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,64,power_law_1.01,0.5254335880279541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,64,power_law_1.2,0.5410687923431396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,64,power_law_1.2,0.5444159984588623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,8,balanced,0.5721760193506876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,8,balanced,0.572218656539917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,8,power_law_1.01,0.6155263900756835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,8,power_law_1.01,0.63155198097229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,8,power_law_1.2,0.6274240016937256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,1,8,power_law_1.2,0.6732351779937744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,16,1,balanced,2.281007925669352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,16,1,balanced,2.2844799359639487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,16,1,power_law_1.01,2.1888959884643553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,16,1,power_law_1.01,2.200032043457031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,16,1,power_law_1.2,2.222707176208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,16,1,power_law_1.2,2.2321151733398437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,2,1,balanced,0.7792747020721436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,2,1,balanced,0.782538652420044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,2,1,power_law_1.01,0.780947208404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,2,1,power_law_1.01,0.7835455894470215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,2,1,power_law_1.2,0.7987135887145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,2,1,power_law_1.2,0.7990079879760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,32,1,balanced,1.9815999666849773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,32,1,balanced,1.989690621693929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,32,1,power_law_1.01,1.9414207458496093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,32,1,power_law_1.01,1.9464704513549804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,32,1,power_law_1.2,1.9728448867797852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,32,1,power_law_1.2,1.9932479858398438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,4,1,balanced,0.5629280010859171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,4,1,balanced,0.564357320467631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,4,1,power_law_1.01,0.5605631828308105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,4,1,power_law_1.01,0.5643328189849853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,4,1,power_law_1.2,0.5704639911651611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,4,1,power_law_1.2,0.5721792221069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,8,1,balanced,2.9933547973632812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,8,1,balanced,3.0162986119588218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,8,1,power_law_1.01,2.8717056274414063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,8,1,power_law_1.01,2.9994239807128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,8,1,power_law_1.2,2.9930240631103517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,2688,1856,6,128,8,1,power_law_1.2,2.999679946899414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,1,balanced,1.5814293225606282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,1,balanced,1.587216059366862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,1,power_law_1.01,1.6706239700317382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,1,power_law_1.01,1.6778432846069335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,1,power_law_1.2,1.7125888824462892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,1,power_law_1.2,1.725503921508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,128,balanced,0.5607839822769165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,128,balanced,0.5610719919204712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,128,power_law_1.01,0.5917312145233155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,128,power_law_1.01,0.5933504104614258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,128,power_law_1.2,0.6052800178527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,128,power_law_1.2,0.6079103946685791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,16,balanced,0.6253493229548136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,16,balanced,0.6289653380711874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,16,power_law_1.01,0.6703872203826904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,16,power_law_1.01,0.6749887943267823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,16,power_law_1.2,0.679699182510376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,16,power_law_1.2,0.6915264129638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,2,balanced,1.105946699778239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,2,balanced,1.1094133059183757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,2,power_law_1.01,1.1765952110290527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,2,power_law_1.01,1.1805760383605957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,2,power_law_1.2,1.2048192024230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,2,power_law_1.2,1.262713623046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,256,balanced,0.5561333497365316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,256,balanced,0.5584959983825684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,256,power_law_1.01,0.5793471813201905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,256,power_law_1.01,0.5806528091430664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,256,power_law_1.2,0.5922815799713135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,256,power_law_1.2,0.5979904174804688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,32,balanced,0.5889600118001302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,32,balanced,0.5893866618474325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,32,power_law_1.01,0.6199295997619629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,32,power_law_1.01,0.6262847900390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,32,power_law_1.2,0.6570496082305908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,32,power_law_1.2,0.6633664131164551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,4,balanced,0.8340213298797607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,4,balanced,0.8379680315653483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,4,power_law_1.01,0.8929792404174804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,4,power_law_1.01,0.9044544219970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,4,power_law_1.2,0.9220288276672364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,4,power_law_1.2,0.9442432403564454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,64,balanced,0.5701333284378052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,64,balanced,0.5704106489817301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,64,power_law_1.01,0.5949632167816162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,64,power_law_1.01,0.5987840175628663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,64,power_law_1.2,0.6178175926208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,64,power_law_1.2,0.6233215808868409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,8,balanced,0.7006080150604248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,8,balanced,0.7044106324513754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,8,power_law_1.01,0.7426239967346191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,8,power_law_1.01,0.7443967819213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,8,power_law_1.2,0.7777984142303467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,1,8,power_law_1.2,0.7851263999938964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,16,1,balanced,0.5114293495814005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,16,1,balanced,0.5129813353220621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,16,1,power_law_1.01,0.5337664127349854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,16,1,power_law_1.01,0.5367424011230468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,16,1,power_law_1.2,0.5406015872955322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,16,1,power_law_1.2,0.5426239967346191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,2,1,balanced,1.0029813448588054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,2,1,balanced,1.0040106773376465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,2,1,power_law_1.01,1.054246425628662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,2,1,power_law_1.01,1.0562432289123536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,2,1,power_law_1.2,1.0753087997436523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,2,1,power_law_1.2,1.0874367713928224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,32,1,balanced,0.47597332795461017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,32,1,balanced,0.4764853318532308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,32,1,power_law_1.01,0.4937280178070068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,32,1,power_law_1.01,0.495743989944458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,32,1,power_law_1.2,0.5036736011505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,32,1,power_law_1.2,0.5037824153900147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,4,1,balanced,0.7047200202941895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,4,1,balanced,0.7074346542358398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,4,1,power_law_1.01,0.7367551803588868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,4,1,power_law_1.01,0.7390912055969239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,4,1,power_law_1.2,0.748364782333374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,4,1,power_law_1.2,0.7499904155731201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,8,1,balanced,0.583413322766622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,8,1,balanced,0.5835626522699991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,8,1,power_law_1.01,0.6024064064025879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,8,1,power_law_1.01,0.6036479949951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,8,1,power_law_1.2,0.6098048210144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,3072,1536,8,256,8,1,power_law_1.2,0.612275218963623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,1,balanced,2.8909174601236978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,1,balanced,2.931898752848307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,1,power_law_1.01,2.720716857910156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,1,power_law_1.01,2.8534400939941404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,1,power_law_1.2,2.762771224975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,1,power_law_1.2,2.7857343673706056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,2,balanced,1.7767200469970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,2,balanced,1.7864054044087727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,2,power_law_1.01,2.08591365814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,2,power_law_1.01,2.1539392471313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,2,power_law_1.2,2.1025856018066404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,2,power_law_1.2,2.2243200302124024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,4,balanced,1.2429973284403484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,4,balanced,1.2542186578114827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,4,power_law_1.01,1.862054443359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,4,power_law_1.01,1.8744192123413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,4,power_law_1.2,1.8212608337402343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,4,power_law_1.2,1.8401151657104493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,8,balanced,1.0211199919382732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,8,balanced,1.0231146812438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,8,power_law_1.01,1.5711551666259767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,8,power_law_1.01,1.7169408798217773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,8,power_law_1.2,1.6384063720703126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,1,8,power_law_1.2,1.7737152099609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,16,1,balanced,0.30370134115219116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,16,1,balanced,0.3040906588236491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,16,1,power_law_1.01,0.30833280086517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,16,1,power_law_1.01,0.30872321128845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,16,1,power_law_1.2,0.3117439985275269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,16,1,power_law_1.2,0.31214079856872556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,2,1,balanced,1.4180213610331218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,2,1,balanced,1.4205172856648762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,2,1,power_law_1.01,1.4211071968078612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,2,1,power_law_1.01,1.460979175567627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,2,1,power_law_1.2,1.428268814086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,2,1,power_law_1.2,1.432159996032715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,32,1,balanced,0.24014933904012045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,32,1,balanced,0.2413653333981832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,32,1,power_law_1.01,0.24265599250793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,32,1,power_law_1.01,0.2435391902923584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,32,1,power_law_1.2,0.24606719017028808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,32,1,power_law_1.2,0.24928638935089112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,4,1,balanced,0.7556906541188558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,4,1,balanced,0.7776266733805338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,4,1,power_law_1.01,0.7654143810272217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,4,1,power_law_1.01,0.7738815784454346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,4,1,power_law_1.2,0.7590015888214111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,4,1,power_law_1.2,0.7748672008514405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,8,1,balanced,0.4461493492126465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,8,1,balanced,0.45205867290496826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,8,1,power_law_1.01,0.4555391788482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,8,1,power_law_1.01,0.4601280212402344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,8,1,power_law_1.2,0.46109437942504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,14336,2,8,8,1,power_law_1.2,0.4641024112701416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,1,balanced,1.5524266560872395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,1,balanced,1.5870933532714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,1,power_law_1.01,1.750111961364746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,1,power_law_1.01,1.7592960357666017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,1,power_law_1.2,1.7601663589477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,1,power_law_1.2,1.7638208389282226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,128,balanced,0.6050613323847452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,128,balanced,0.6066986719767252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,128,power_law_1.01,0.6578176021575928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,128,power_law_1.01,0.6597504138946533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,128,power_law_1.2,0.6990015983581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,128,power_law_1.2,0.7015552043914794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,16,balanced,0.6646080017089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,16,balanced,0.666650652885437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,16,power_law_1.01,0.7481728076934815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,16,power_law_1.01,0.7715904235839843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,16,power_law_1.2,0.7675456047058106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,16,power_law_1.2,0.8006719589233399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,2,balanced,1.1282026767730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,2,balanced,1.1288800239562988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,2,power_law_1.01,1.2662912368774415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,2,power_law_1.01,1.281670379638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,2,power_law_1.2,1.2838784217834474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,2,power_law_1.2,1.2995583534240722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,32,balanced,0.6312319835027059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,32,balanced,0.632751981417338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,32,power_law_1.01,0.7020095825195313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,32,power_law_1.01,0.703443193435669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,32,power_law_1.2,0.7477439880371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,32,power_law_1.2,0.7498496055603028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,4,balanced,0.8729279836018881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,4,balanced,0.8732960224151611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,4,power_law_1.01,0.979980754852295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,4,power_law_1.01,1.009836769104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,4,power_law_1.2,1.0310272216796874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,4,power_law_1.2,1.044115161895752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,64,balanced,0.6121386686960856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,64,balanced,0.6127093235651652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,64,power_law_1.01,0.6686912059783936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,64,power_law_1.01,0.6884031772613526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,64,power_law_1.2,0.7069439888000488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,64,power_law_1.2,0.7285568237304687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,8,balanced,0.7326026757558187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,8,balanced,0.7356266975402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,8,power_law_1.01,0.8185407638549804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,8,power_law_1.01,0.8438015937805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,8,power_law_1.2,0.8761983871459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,1,8,power_law_1.2,0.900108814239502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,16,1,balanced,0.5516000191370646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,16,1,balanced,0.5523946682612101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,16,1,power_law_1.01,0.5994048118591309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,16,1,power_law_1.01,0.6002240180969238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,16,1,power_law_1.2,0.6057216167449951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,16,1,power_law_1.2,0.6070464134216309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,2,1,balanced,1.0125866731007893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,2,1,balanced,1.0155733426411946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,2,1,power_law_1.01,1.1155776023864745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,2,1,power_law_1.01,1.1174912452697754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,2,1,power_law_1.2,1.132364845275879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,2,1,power_law_1.2,1.1328191757202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,32,1,balanced,0.5258293151855469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,32,1,balanced,0.5274133284886678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,32,1,power_law_1.01,0.5616511821746826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,32,1,power_law_1.01,0.5628992080688476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,32,1,power_law_1.2,0.5655935764312744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,32,1,power_law_1.2,0.5675583839416504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,4,1,balanced,0.7276000181833903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,4,1,balanced,0.7295786539713541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,4,1,power_law_1.01,0.7960576057434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,4,1,power_law_1.01,0.8000639915466309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,4,1,power_law_1.2,0.8027199745178223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,4,1,power_law_1.2,0.8030655860900879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,8,1,balanced,0.61134934425354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,8,1,balanced,0.6118880112965902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,8,1,power_law_1.01,0.658892822265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,8,1,power_law_1.01,0.6633535861968994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,8,1,power_law_1.2,0.6666111946105957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,1536,8,128,8,1,power_law_1.2,0.6670720100402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,1,balanced,10.096005121866861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,1,balanced,9.925135930379232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,1,power_law_1.01,9.029248046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,1,power_law_1.01,9.114694213867187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,1,power_law_1.2,9.178329467773438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,1,power_law_1.2,9.259474945068359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,128,balanced,2.1752212842305503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,128,balanced,2.1763200759887695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,128,power_law_1.01,2.260371208190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,128,power_law_1.01,2.267769622802734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,128,power_law_1.2,2.304742431640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,128,power_law_1.2,2.3314943313598633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,16,balanced,2.548917293548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,16,balanced,2.55948797861735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,16,power_law_1.01,2.6711679458618165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,16,power_law_1.01,2.683366394042969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,16,power_law_1.2,2.7293888092041017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,16,power_law_1.2,2.8135040283203123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,2,balanced,5.720309575398763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,2,balanced,5.8082930246988935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,2,power_law_1.01,5.569190216064453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,2,power_law_1.01,5.644992065429688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,2,power_law_1.2,5.808127975463867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,2,power_law_1.2,5.872140884399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,256,balanced,2.1489814122517905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,256,balanced,2.149493376413981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,256,power_law_1.01,2.219500732421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,256,power_law_1.01,2.2243776321411133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,256,power_law_1.2,2.2901119232177733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,256,power_law_1.2,2.2902399063110352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,32,balanced,2.335007985432943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,32,balanced,2.347434679667155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,32,power_law_1.01,2.4518911361694338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,32,power_law_1.01,2.459116744995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,32,power_law_1.2,2.5356735229492187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,32,power_law_1.2,2.5508800506591798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,4,balanced,3.7658987045288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,4,balanced,3.794528007507324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,4,power_law_1.01,3.826131057739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,4,power_law_1.01,3.8779006958007813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,4,power_law_1.2,3.971692657470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,4,power_law_1.2,3.986943817138672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,64,balanced,2.229311943054199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,64,balanced,2.229530652364095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,64,power_law_1.01,2.336172866821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,64,power_law_1.01,2.342963218688965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,64,power_law_1.2,2.3884735107421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,64,power_law_1.2,2.4414464950561525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,8,balanced,2.958101272583008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,8,balanced,2.964821179707845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,8,power_law_1.01,3.084480094909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,8,power_law_1.01,3.1396799087524414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,8,power_law_1.2,3.1967872619628905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,1,8,power_law_1.2,3.286649703979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,16,1,balanced,16.246810913085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,16,1,balanced,16.409386952718098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,16,1,power_law_1.01,15.781178283691407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,16,1,power_law_1.01,15.78522186279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,16,1,power_law_1.2,16.070611572265626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,16,1,power_law_1.2,16.209625244140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,2,1,balanced,5.352912267049153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,2,1,balanced,5.3668638865153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,2,1,power_law_1.01,5.01591682434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,2,1,power_law_1.01,5.078092956542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,2,1,power_law_1.2,5.088966369628906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,2,1,power_law_1.2,5.142099380493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,32,1,balanced,11.65002695719401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,32,1,balanced,12.002245585123697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,32,1,power_law_1.01,10.976812744140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,32,1,power_law_1.01,11.000281524658202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,32,1,power_law_1.2,11.183379364013671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,32,1,power_law_1.2,11.205017852783204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,4,1,balanced,3.3298721313476562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,4,1,balanced,3.3367945353190103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,4,1,power_law_1.01,3.160940742492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,4,1,power_law_1.01,3.1766271591186523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,4,1,power_law_1.2,3.1637504577636717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,4,1,power_law_1.2,3.194803237915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,8,1,balanced,2.3473386764526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,8,1,balanced,2.363797346750895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,8,1,power_law_1.01,2.22357120513916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,8,1,power_law_1.01,2.2350271224975584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,8,1,power_law_1.2,2.266316795349121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,4096,2688,22,512,8,1,power_law_1.2,2.279539108276367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,1,balanced,4.535733222961426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,1,balanced,4.542064030965169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,1,power_law_1.01,4.574899291992187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,1,power_law_1.01,4.655180740356445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,1,power_law_1.2,4.475033569335937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,1,power_law_1.2,4.534815979003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,2,balanced,2.6238293647766113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,2,balanced,2.6453493436177573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,2,power_law_1.01,3.14849910736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,2,power_law_1.01,4.021139144897461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,2,power_law_1.2,3.3888126373291017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,2,power_law_1.2,3.7827007293701174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,4,balanced,1.6652906735738118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,4,balanced,1.6861173311869304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,4,power_law_1.01,2.584448051452637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,4,power_law_1.01,2.651424026489258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,4,power_law_1.2,2.696563148498535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,4,power_law_1.2,2.9785024642944338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,8,balanced,1.2673226992289226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,8,balanced,1.2733973662058513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,8,power_law_1.01,2.380633544921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,8,power_law_1.01,2.4903488159179688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,8,power_law_1.2,2.4050111770629883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,1,8,power_law_1.2,2.485843276977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,16,1,balanced,0.45338133970896405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,16,1,balanced,0.4541333516438802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,16,1,power_law_1.01,0.4567039966583252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,16,1,power_law_1.01,0.45780482292175295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,16,1,power_law_1.2,0.4557504177093506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,16,1,power_law_1.2,0.4593599796295166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,2,1,balanced,2.2193759282430015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,2,1,balanced,2.226384003957113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,2,1,power_law_1.01,2.251910400390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,2,1,power_law_1.01,2.293408012390137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,2,1,power_law_1.2,2.2662464141845704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,2,1,power_law_1.2,2.2770879745483397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,32,1,balanced,0.3330026666323344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,32,1,balanced,0.33613868554433185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,32,1,power_law_1.01,0.34047999382019045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,32,1,power_law_1.01,0.34170238971710204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,32,1,power_law_1.2,0.3388159990310669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,32,1,power_law_1.2,0.3404416084289551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,4,1,balanced,1.1810452938079834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,4,1,balanced,1.1980960369110107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,4,1,power_law_1.01,1.2115391731262206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,4,1,power_law_1.01,1.2253503799438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,4,1,power_law_1.2,1.208083152770996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,4,1,power_law_1.2,1.2290559768676759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,8,1,balanced,0.6836960315704346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,8,1,balanced,0.6911839644114176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,8,1,power_law_1.01,0.6955327987670898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,8,1,power_law_1.01,0.6996032238006592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,8,1,power_law_1.2,0.6942080020904541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,16384,2,8,8,1,power_law_1.2,0.6994944095611573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,1,balanced,3.8718560536702475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,1,balanced,3.993962605794271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,1,power_law_1.01,3.940883255004883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,1,power_law_1.01,4.049023818969727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,1,power_law_1.2,4.157318496704102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,1,power_law_1.2,4.177964782714843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,128,balanced,0.8899253209431967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,128,balanced,0.8906346956888834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,128,power_law_1.01,0.9489343643188477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,128,power_law_1.01,0.962399959564209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,128,power_law_1.2,0.9878527641296386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,128,power_law_1.2,0.9926655769348145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,16,balanced,1.0526933670043945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,16,balanced,1.0547626813252766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,16,power_law_1.01,1.1518848419189454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,16,power_law_1.01,1.1774656295776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,16,power_law_1.2,1.1917695999145508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,16,power_law_1.2,1.1934335708618165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,2,balanced,2.309552033742269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,2,balanced,2.363248030344645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,2,power_law_1.01,2.4860416412353517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,2,power_law_1.01,2.5156671524047853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,2,power_law_1.2,2.5579456329345702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,2,power_law_1.2,2.5880512237548827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,256,balanced,0.8806773026784261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,256,balanced,0.8816800117492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,256,power_law_1.01,0.9345343589782715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,256,power_law_1.01,0.93569917678833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,256,power_law_1.2,0.9930303573608399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,256,power_law_1.2,0.9970047950744629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,32,balanced,0.9611093203226725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,32,balanced,0.9641280174255371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,32,power_law_1.01,1.036780834197998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,32,power_law_1.01,1.0369471549987792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,32,power_law_1.2,1.098367977142334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,32,power_law_1.2,1.1096256256103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,4,balanced,1.5915466944376628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,4,balanced,1.6033013661702473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,4,power_law_1.01,1.7208896636962892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,4,power_law_1.01,1.742905616760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,4,power_law_1.2,1.7574335098266602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,4,power_law_1.2,1.8396928787231446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,64,balanced,0.9154720306396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,64,balanced,0.9170080025990804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,64,power_law_1.01,0.9812416076660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,64,power_law_1.01,0.9917119979858399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,64,power_law_1.2,1.0509440422058105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,64,power_law_1.2,1.0622464179992677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,8,balanced,1.2271946271260579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,8,balanced,1.2372852961222331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,8,power_law_1.01,1.3778559684753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,8,power_law_1.01,1.3958592414855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,8,power_law_1.2,1.4276479721069335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,1,8,power_law_1.2,1.429152011871338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,16,1,balanced,0.910271962483724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,16,1,balanced,0.9121973514556885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,16,1,power_law_1.01,0.9398591995239258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,16,1,power_law_1.01,0.9409664154052735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,16,1,power_law_1.2,0.9495295524597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,16,1,power_law_1.2,0.9581760406494141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,2,1,balanced,2.124394734700521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,2,1,balanced,2.165226618448893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,2,1,power_law_1.01,2.2528575897216796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,2,1,power_law_1.01,2.2689983367919924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,2,1,power_law_1.2,2.293619155883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,2,1,power_law_1.2,2.3192895889282226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,32,1,balanced,0.8369332949320475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,32,1,balanced,0.837440013885498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,32,1,power_law_1.01,0.8638976097106934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,32,1,power_law_1.01,0.8654335975646973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,32,1,power_law_1.2,0.8738559722900391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,32,1,power_law_1.2,0.8755071640014649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,4,1,balanced,1.4009920756022136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,4,1,balanced,1.4061226844787598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,4,1,power_law_1.01,1.4770432472229005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,4,1,power_law_1.01,1.484659194946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,4,1,power_law_1.2,1.5006208419799805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,4,1,power_law_1.2,1.5057472229003905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,8,1,balanced,1.0679466724395752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,8,1,balanced,1.0703413486480713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,8,1,power_law_1.01,1.1129664421081542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,8,1,power_law_1.01,1.1185407638549805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,8,1,power_law_1.2,1.129862403869629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2048,8,256,8,1,power_law_1.2,1.133561611175537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,1,balanced,4.417509396870931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,1,balanced,4.622709274291992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,1,power_law_1.01,4.015379333496094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,1,power_law_1.01,4.067763137817383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,1,power_law_1.2,3.9945663452148437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,1,power_law_1.2,4.284185409545898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,16,balanced,1.1080479621887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,16,balanced,1.11189866065979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,16,power_law_1.01,1.248204803466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,16,power_law_1.01,1.2827967643737792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,16,power_law_1.2,1.355795192718506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,16,power_law_1.2,1.369491195678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,2,balanced,2.4971307118733725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,2,balanced,2.641695976257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,2,power_law_1.01,2.550457572937012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,2,power_law_1.01,2.6619840621948243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,2,power_law_1.2,2.6267648696899415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,2,power_law_1.2,2.6839040756225585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,32,balanced,1.0075573126475017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,32,balanced,1.008239984512329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,32,power_law_1.01,1.124403190612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,32,power_law_1.01,1.1371392250061034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,32,power_law_1.2,1.232857608795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,32,power_law_1.2,1.2859711647033691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,4,balanced,1.699168046315511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,4,balanced,1.7064053217569988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,4,power_law_1.01,1.8199743270874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,4,power_law_1.01,1.960927963256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,4,power_law_1.2,1.9555135726928712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,4,power_law_1.2,2.0272064208984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,8,balanced,1.3025866349538167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,8,balanced,1.304527997970581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,8,power_law_1.01,1.446073627471924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,8,power_law_1.01,1.4710016250610352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,8,power_law_1.2,1.6159616470336915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,1,8,power_law_1.2,1.6486143112182616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,16,1,balanced,0.9368746280670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,16,1,balanced,0.9373226960500082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,16,1,power_law_1.01,0.960108757019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,16,1,power_law_1.01,0.9617728233337403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,16,1,power_law_1.2,0.9626560211181641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,16,1,power_law_1.2,0.9651712417602539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,2,1,balanced,2.3232480684916177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,2,1,balanced,2.348911921183268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,2,1,power_law_1.01,2.2810943603515623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,2,1,power_law_1.01,2.347360038757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,2,1,power_law_1.2,2.3363519668579102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,2,1,power_law_1.2,2.393516731262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,32,1,balanced,0.8577120304107666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,32,1,balanced,0.8582239945729574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,32,1,power_law_1.01,0.8632255554199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,32,1,power_law_1.01,0.866214370727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,32,1,power_law_1.2,0.8722240447998046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,32,1,power_law_1.2,0.8754688262939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,4,1,balanced,1.4981120427449544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,4,1,balanced,1.510170618693034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,4,1,power_law_1.01,1.5042752265930175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,4,1,power_law_1.01,1.5055359840393066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,4,1,power_law_1.2,1.5124735832214355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,4,1,power_law_1.2,1.5178815841674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,8,1,balanced,1.1040693124135335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,8,1,balanced,1.105733315149943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,8,1,power_law_1.01,1.1053695678710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,8,1,power_law_1.01,1.1098112106323241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,8,1,power_law_1.2,1.1126272201538085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,6144,2560,8,160,8,1,power_law_1.2,1.1143232345581056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,1,balanced,4.441909472147624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,1,balanced,4.503237406412761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,1,power_law_1.01,4.651916885375977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,1,power_law_1.01,4.654137420654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,1,power_law_1.2,4.77130241394043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,1,power_law_1.2,4.9222465515136715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,128,balanced,0.9765973091125488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,128,balanced,0.9783679644266764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,128,power_law_1.01,1.0538559913635255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,128,power_law_1.01,1.0596608161926269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,128,power_law_1.2,1.1104384422302247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,128,power_law_1.2,1.1119039535522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,16,balanced,1.1647199789683025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,16,balanced,1.1647306283315022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,16,power_law_1.01,1.2873472213745116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,16,power_law_1.01,1.3289536476135253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,16,power_law_1.2,1.3784704208374023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,16,power_law_1.2,1.3882752418518067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,2,balanced,2.632693290710449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,2,balanced,2.646341323852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,2,power_law_1.01,2.8184320449829103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,2,power_law_1.01,2.8678400039672853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,2,power_law_1.2,2.9339263916015623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,2,power_law_1.2,2.9518463134765627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,256,balanced,0.9650239944458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,256,balanced,0.966111977895101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,256,power_law_1.01,1.0264512062072755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,256,power_law_1.01,1.0278207778930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,256,power_law_1.2,1.0873215675354004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,256,power_law_1.2,1.0922240257263183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,32,balanced,1.0591519673665364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,32,balanced,1.0621813138326008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,32,power_law_1.01,1.144422435760498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,32,power_law_1.01,1.1680768013000489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,32,power_law_1.2,1.1985792160034179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,32,power_law_1.2,1.2121024131774902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,4,balanced,1.787178675333659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,4,balanced,1.7893865903218586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,4,power_law_1.01,2.002649688720703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,4,power_law_1.01,2.0093055725097657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,4,power_law_1.2,2.0238975524902343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,4,power_law_1.2,2.03756160736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,64,balanced,1.0030720233917236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,64,balanced,1.006815989812215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,64,power_law_1.01,1.0965184211730956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,64,power_law_1.01,1.1026368141174316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,64,power_law_1.2,1.1430463790893555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,64,power_law_1.2,1.1609343528747558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,8,balanced,1.377962589263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,8,balanced,1.377994696299235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,8,power_law_1.01,1.4912256240844726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,8,power_law_1.01,1.5391615867614745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,8,power_law_1.2,1.5487615585327148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,1,8,power_law_1.2,1.5818495750427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,16,1,balanced,1.0421866575876872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,16,1,balanced,1.0431093374888103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,16,1,power_law_1.01,1.071571159362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,16,1,power_law_1.01,1.0742464065551758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,16,1,power_law_1.2,1.087929630279541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,16,1,power_law_1.2,1.0889087677001954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,2,1,balanced,2.4650932947794595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,2,1,balanced,2.505573272705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,2,1,power_law_1.01,2.5764928817749024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,2,1,power_law_1.01,2.5978879928588867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,2,1,power_law_1.2,2.62172794342041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,2,1,power_law_1.2,2.6633983612060548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,32,1,balanced,0.9569546381632487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,32,1,balanced,0.9572479724884033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,32,1,power_law_1.01,0.9875007629394531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,32,1,power_law_1.01,0.9893440246582031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,32,1,power_law_1.2,0.9995455741882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,32,1,power_law_1.2,1.0003392219543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,4,1,balanced,1.607594648996989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,4,1,balanced,1.6161972681681316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,4,1,power_law_1.01,1.7019968032836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,4,1,power_law_1.01,1.7076351165771484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,4,1,power_law_1.2,1.7224063873291016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,4,1,power_law_1.2,1.735308837890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,8,1,balanced,1.2271040280659993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,8,1,balanced,1.229093313217163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,8,1,power_law_1.01,1.2770560264587403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,8,1,power_law_1.01,1.287769603729248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,8,1,power_law_1.2,1.2972736358642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,256,8,1,power_law_1.2,1.3006848335266112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,1,balanced,4.305535952250163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,1,balanced,4.331631978352864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,1,power_law_1.01,5.455712127685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,1,power_law_1.01,5.653196716308594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,1,power_law_1.2,5.559257507324219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,1,power_law_1.2,5.932735824584961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,128,balanced,1.0279466311136882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,128,balanced,1.0295519828796387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,128,power_law_1.01,1.0929792404174805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,128,power_law_1.01,1.1020095825195313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,128,power_law_1.2,1.1323391914367675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,128,power_law_1.2,1.134540843963623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,16,balanced,1.2053866386413574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,16,balanced,1.2081973552703857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,16,power_law_1.01,1.3626751899719238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,16,power_law_1.01,1.3765695571899415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,16,power_law_1.2,1.403264045715332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,16,power_law_1.2,1.4114432334899902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,2,balanced,2.6807146072387695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,2,balanced,2.7818241119384766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,2,power_law_1.01,3.224844741821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,2,power_law_1.01,3.2259902954101562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,2,power_law_1.2,3.3683712005615236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,2,power_law_1.2,3.387577438354492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,32,balanced,1.106607993443807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,32,balanced,1.1067466735839844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,32,power_law_1.01,1.2136704444885253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,32,power_law_1.01,1.2264320373535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,32,power_law_1.2,1.2660736083984374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,32,power_law_1.2,1.2712127685546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,4,balanced,1.8105653127034504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,4,balanced,1.814575990041097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,4,power_law_1.01,2.1768896102905275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,4,power_law_1.01,2.197887992858887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,4,power_law_1.2,2.265145683288574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,4,power_law_1.2,2.2722944259643554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,64,balanced,1.0527253150939941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,64,balanced,1.053066651026408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,64,power_law_1.01,1.1384639739990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,64,power_law_1.01,1.150656032562256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,64,power_law_1.2,1.1682304382324218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,64,power_law_1.2,1.1859775543212892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,8,balanced,1.4146773020426433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,8,balanced,1.4159092903137207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,8,power_law_1.01,1.624460792541504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,8,power_law_1.01,1.6524927139282226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,8,power_law_1.2,1.699295997619629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,1,8,power_law_1.2,1.7151039123535157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,16,1,balanced,1.0156213442484539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,16,1,balanced,1.0168373584747314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,16,1,power_law_1.01,1.1957440376281738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,16,1,power_law_1.01,1.1957951545715333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,16,1,power_law_1.2,1.218118381500244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,16,1,power_law_1.2,1.2191231727600098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,2,1,balanced,2.433231989542643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,2,1,balanced,2.4623573621114097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,2,1,power_law_1.01,2.995078468322754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,2,1,power_law_1.01,3.0032447814941405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,2,1,power_law_1.2,3.1096319198608398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,2,1,power_law_1.2,3.127903938293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,32,1,balanced,0.9457333087921143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,32,1,balanced,0.9462080001831055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,32,1,power_law_1.01,1.0988927841186524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,32,1,power_law_1.01,1.0999360084533691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,32,1,power_law_1.2,1.1220224380493165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,32,1,power_law_1.2,1.1224512100219726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,4,1,balanced,1.5753919283548992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,4,1,balanced,1.5827892621358235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,4,1,power_law_1.01,1.9173503875732423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,4,1,power_law_1.01,1.9322431564331055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,4,1,power_law_1.2,1.9830144882202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,4,1,power_law_1.2,2.0003839492797852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,8,1,balanced,1.211839993794759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,8,1,balanced,1.214026689529419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,8,1,power_law_1.01,1.4278016090393066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,8,1,power_law_1.01,1.4320192337036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,8,1,power_law_1.2,1.4787712097167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,6144,7168,2048,8,384,8,1,power_law_1.2,1.4822400093078614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,1,balanced,0.1530506710211436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,1,balanced,0.15364799896876016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,1,power_law_1.01,0.13927040100097657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,1,power_law_1.01,0.14206080436706542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,1,power_law_1.2,0.13955199718475342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,1,power_law_1.2,0.1423616051673889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,128,balanced,0.033589333295822144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,128,balanced,0.03379733363787333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,128,power_law_1.01,0.0323199987411499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,128,power_law_1.01,0.03335039913654327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,128,power_law_1.2,0.03199360072612763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,128,power_law_1.2,0.03260799944400787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,16,balanced,0.039503999054431915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,16,balanced,0.03966933240493139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,16,power_law_1.01,0.0379967987537384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,16,power_law_1.01,0.038099199533462524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,16,power_law_1.2,0.037887999415397645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,16,power_law_1.2,0.03825919926166534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,2,balanced,0.09726933638254802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,2,balanced,0.09911466638247173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,2,power_law_1.01,0.089273601770401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,2,power_law_1.01,0.0918720006942749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,2,power_law_1.2,0.09183359742164612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,2,power_law_1.2,0.09185280203819275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,32,balanced,0.03563733398914337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,32,balanced,0.03583999971548716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,32,power_law_1.01,0.033548799157142636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,32,power_law_1.01,0.034092798829078674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,32,power_law_1.2,0.03455359935760498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,32,power_law_1.2,0.03461120128631592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,4,balanced,0.0672159989674886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,4,balanced,0.06844266752401988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,4,power_law_1.01,0.0658623993396759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,4,power_law_1.01,0.06705920100212097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,4,power_law_1.2,0.0657472014427185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,4,power_law_1.2,0.06676480174064636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,64,balanced,0.033557333052158356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,64,balanced,0.03356799980004629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,64,power_law_1.01,0.03258239924907684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,64,power_law_1.01,0.03287039995193482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,64,power_law_1.2,0.03304960131645203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,64,power_law_1.2,0.0333759993314743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,8,balanced,0.04994133114814758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,8,balanced,0.05110399921735128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,8,power_law_1.01,0.046137601137161255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,8,power_law_1.01,0.047225600481033324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,8,power_law_1.2,0.045721599459648134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,1,8,power_law_1.2,0.04864639937877655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,2,1,balanced,0.09854400157928467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,2,1,balanced,0.10051733255386353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,2,1,power_law_1.01,0.09102720022201538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,2,1,power_law_1.01,0.09185919761657715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,2,1,power_law_1.2,0.09284480214118958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,2,1,power_law_1.2,0.09367679953575134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,4,1,balanced,0.07388799885908763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,4,1,balanced,0.07430399954319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,4,1,power_law_1.01,0.069651198387146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,4,1,power_law_1.01,0.07043840289115906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,4,1,power_law_1.2,0.07091839909553528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2048,768,8,128,4,1,power_law_1.2,0.07141119837760926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,1,balanced,0.38551998138427734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,1,balanced,0.3872053225835164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,1,power_law_1.01,0.3232448101043701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,1,power_law_1.01,0.3280895948410034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,1,power_law_1.2,0.3276927947998047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,1,power_law_1.2,0.3280384063720703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,128,balanced,0.03965333352486292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,128,balanced,0.03976533313592275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,128,power_law_1.01,0.03891839981079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,128,power_law_1.01,0.038975998759269714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,128,power_law_1.2,0.038771200180053714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,128,power_law_1.2,0.03932160139083862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,16,balanced,0.06579199930032094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,16,balanced,0.06643199920654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,16,power_law_1.01,0.06394240260124207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,16,power_law_1.01,0.06394879817962647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,16,power_law_1.2,0.06149759888648987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,16,power_law_1.2,0.06257920265197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,2,balanced,0.21917865673700967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,2,balanced,0.22059732675552368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,2,power_law_1.01,0.17982720136642455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,2,power_law_1.01,0.19568639993667603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,2,power_law_1.2,0.18892799615859984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,2,power_law_1.2,0.1897663950920105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,32,balanced,0.04649066428343455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,32,balanced,0.047872001926104225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,32,power_law_1.01,0.04576640129089356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,32,power_law_1.01,0.04644480049610138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,32,power_law_1.2,0.046035200357437134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,32,power_law_1.2,0.04653440117835998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,4,balanced,0.13383466998736063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,4,balanced,0.13429333766301474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,4,power_law_1.01,0.12030080556869507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,4,power_law_1.01,0.12130559682846069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,4,power_law_1.2,0.11661440134048462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,4,power_law_1.2,0.11978880167007447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,64,balanced,0.04372799893220266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,64,balanced,0.04389866689840952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,64,power_law_1.01,0.0421887993812561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,64,power_law_1.01,0.04237439930438995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,64,power_law_1.2,0.04270719885826111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,64,power_law_1.2,0.04296959936618805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,8,balanced,0.09291199843088786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,8,balanced,0.09303999940554301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,8,power_law_1.01,0.08054400086402894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,8,power_law_1.01,0.08477439880371093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,8,power_law_1.2,0.08260480165481568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,1,8,power_law_1.2,0.08536319732666016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,16,1,balanced,0.2416426738103231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,16,1,balanced,0.24241065979003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,16,1,power_law_1.01,0.2083712100982666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,16,1,power_law_1.01,0.21182079315185548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,16,1,power_law_1.2,0.20723841190338135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,16,1,power_law_1.2,0.21125121116638185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,2,1,balanced,0.22430400053660074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,2,1,balanced,0.22470933198928833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,2,1,power_law_1.01,0.19011839628219604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,2,1,power_law_1.01,0.19236479997634887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,2,1,power_law_1.2,0.19545600414276124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,2,1,power_law_1.2,0.19712640047073365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,32,1,balanced,0.2164106567700704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,32,1,balanced,0.2174560030301412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,32,1,power_law_1.01,0.1841215968132019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,32,1,power_law_1.01,0.18554240465164185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,32,1,power_law_1.2,0.18490879535675048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,32,1,power_law_1.2,0.1888576030731201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,4,1,balanced,0.13913599650065103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,4,1,balanced,0.1394773324330648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,4,1,power_law_1.01,0.12008320093154908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,4,1,power_law_1.01,0.12123520374298095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,4,1,power_law_1.2,0.12079360485076904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,4,1,power_law_1.2,0.12387839555740357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,8,1,balanced,0.3017599980036418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,8,1,balanced,0.30295999844868976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,8,1,power_law_1.01,0.2519615888595581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,8,1,power_law_1.01,0.2537791967391968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,8,1,power_law_1.2,0.2454591989517212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,2688,1856,6,128,8,1,power_law_1.2,0.26182401180267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,1,balanced,0.6853439807891846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,1,balanced,0.7077919642130533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,1,power_law_1.01,0.5295423984527587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,1,power_law_1.01,0.5348351955413818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,1,power_law_1.2,0.5143167972564697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,1,power_law_1.2,0.5160064220428466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,128,balanced,0.0418453315893809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,128,balanced,0.041850666205088295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,128,power_law_1.01,0.040915200114250184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,128,power_law_1.01,0.04097279906272888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,128,power_law_1.2,0.041119998693466185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,128,power_law_1.2,0.04159359931945801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,16,balanced,0.08555733164151509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,16,balanced,0.08730666836102803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,16,power_law_1.01,0.08021759986877441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,16,power_law_1.01,0.0815999984741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,16,power_law_1.2,0.07603840231895446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,16,power_law_1.2,0.07942399978637696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,2,balanced,0.369706670443217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,2,balanced,0.37548800309499103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,2,power_law_1.01,0.2987584114074707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,2,power_law_1.01,0.29901440143585206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,2,power_law_1.2,0.26981120109558104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,2,power_law_1.2,0.29818880558013916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,256,balanced,0.04042666653792063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,256,balanced,0.04154666761557261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,256,power_law_1.01,0.038867199420928956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,256,power_law_1.01,0.03930239975452423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,256,power_law_1.2,0.03999359905719757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,256,power_law_1.2,0.04069760143756866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,32,balanced,0.0683786670366923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,32,balanced,0.07035199801127116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,32,power_law_1.01,0.061318397521972656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,32,power_law_1.01,0.0643392026424408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,32,power_law_1.2,0.0584384024143219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,32,power_law_1.2,0.0640447974205017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,4,balanced,0.20560000340143839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,4,balanced,0.20662933588027954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,4,power_law_1.01,0.18264960050582885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,4,power_law_1.01,0.1826815962791443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,4,power_law_1.2,0.16503039598464966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,4,power_law_1.2,0.17785600423812867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,64,balanced,0.04797333478927612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,64,power_law_1.01,0.04672000110149384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,64,power_law_1.01,0.047654399275779726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,64,power_law_1.2,0.04759039878845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,64,power_law_1.2,0.047603198885917665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,8,balanced,0.12660266955693564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,8,balanced,0.12808533509572348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,8,power_law_1.01,0.11704959869384765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,8,power_law_1.01,0.12053120136260986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,8,power_law_1.2,0.10726399421691894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,1,8,power_law_1.2,0.11471999883651733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,16,1,balanced,0.11168000102043152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,16,1,balanced,0.11328533291816711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,16,1,power_law_1.01,0.09378560185432434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,16,1,power_law_1.01,0.0941760003566742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,16,1,power_law_1.2,0.09249920248985291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,16,1,power_law_1.2,0.09288319945335388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,2,1,balanced,0.377674659093221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,2,1,balanced,0.378490686416626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,2,1,power_law_1.01,0.2903167963027954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,2,1,power_law_1.01,0.29395198822021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,2,1,power_law_1.2,0.28485760688781736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,2,1,power_law_1.2,0.2928319931030273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,32,1,balanced,0.10060800115267436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,32,1,balanced,0.10150399804115295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,32,1,power_law_1.01,0.08056960105895997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,32,1,power_law_1.01,0.08346239924430847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,32,1,power_law_1.2,0.08106240034103393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,4,1,balanced,0.2242506742477417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,4,1,balanced,0.23031467199325562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,4,1,power_law_1.01,0.17587200403213502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,4,1,power_law_1.01,0.1778048038482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,4,1,power_law_1.2,0.17423360347747802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,4,1,power_law_1.2,0.17599999904632568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,8,1,balanced,0.15556266903877258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,8,1,balanced,0.15582933028539023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,8,1,power_law_1.01,0.12718080282211303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,8,1,power_law_1.01,0.12833280563354493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,8,1,power_law_1.2,0.12718080282211303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,3072,1536,8,256,8,1,power_law_1.2,0.12788480520248413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,1,balanced,0.3293600082397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,1,balanced,0.33050666252772015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,1,power_law_1.01,0.3473088026046753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,1,power_law_1.01,0.3571775913238525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,1,power_law_1.2,0.34977920055389405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,1,power_law_1.2,0.35399680137634276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,2,balanced,0.22124266624450684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,2,balanced,0.22821333010991415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,2,power_law_1.01,0.22318720817565918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,2,power_law_1.01,0.22432639598846435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,2,power_law_1.2,0.22641279697418212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,2,power_law_1.2,0.23150079250335692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,4,balanced,0.15255999565124512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,4,balanced,0.15704533457756042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,4,power_law_1.01,0.16213120222091676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,4,power_law_1.01,0.1704319953918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,4,power_law_1.2,0.16895359754562378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,4,power_law_1.2,0.17517440319061278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,8,balanced,0.1218933363755544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,8,balanced,0.12643733620643616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,8,power_law_1.01,0.14279680252075194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,8,power_law_1.01,0.1429759979248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,8,power_law_1.2,0.1385856032371521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,1,8,power_law_1.2,0.1419584035873413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,16,1,balanced,0.047930667797724404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,16,1,balanced,0.04990399877230326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,16,1,power_law_1.01,0.05025280117988586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,16,1,power_law_1.01,0.0506496012210846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,16,1,power_law_1.2,0.05002880096435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,16,1,power_law_1.2,0.05370879769325256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,2,1,balanced,0.19283199310302734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,2,1,balanced,0.2299519975980123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,2,1,power_law_1.01,0.18852479457855226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,2,1,power_law_1.01,0.19472639560699462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,2,1,power_law_1.2,0.19071359634399415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,2,1,power_law_1.2,0.1930176019668579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,32,1,balanced,0.03736000011364619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,32,1,balanced,0.03769599894682566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,32,1,power_law_1.01,0.03596799969673157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,32,1,power_law_1.01,0.03632639944553375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,32,1,power_law_1.2,0.036320000886917114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,32,1,power_law_1.2,0.036422398686408994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,4,1,balanced,0.11337066690127055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,4,1,balanced,0.11371733744939168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,4,1,power_law_1.01,0.11194239854812622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,4,1,power_law_1.01,0.11336319446563721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,4,1,power_law_1.2,0.11228159666061402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,4,1,power_law_1.2,0.11347839832305909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,8,1,balanced,0.07706666489442189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,8,1,balanced,0.07752533257007599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,8,1,power_law_1.01,0.07348480224609374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,8,1,power_law_1.01,0.07441279888153077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,8,1,power_law_1.2,0.07329279780387879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,14336,2,8,8,1,power_law_1.2,0.0756991982460022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,1,balanced,0.46963731447855633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,1,balanced,0.4699360132217407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,1,power_law_1.01,0.42366719245910645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,1,power_law_1.01,0.42829442024230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,1,power_law_1.2,0.4238463878631592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,1,power_law_1.2,0.4353919982910156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,128,balanced,0.04181333382924398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,128,balanced,0.04376000165939331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,128,power_law_1.01,0.04188160002231598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,128,power_law_1.01,0.04207360148429871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,128,power_law_1.2,0.04216319918632507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,128,power_law_1.2,0.04222719967365265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,16,balanced,0.07854400078455608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,16,balanced,0.07865066826343536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,16,power_law_1.01,0.07554559707641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,16,power_law_1.01,0.07560960054397584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,16,power_law_1.2,0.07221119999885559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,16,power_law_1.2,0.07408639788627625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,2,balanced,0.2592853307723999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,2,balanced,0.2600373427073161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,2,power_law_1.01,0.23923840522766113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,2,power_law_1.01,0.23932158946990967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,2,power_law_1.2,0.24217600822448732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,2,power_law_1.2,0.24418559074401855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,32,balanced,0.05402666827042898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,32,balanced,0.05499200026194254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,32,power_law_1.01,0.054028797149658206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,32,power_law_1.01,0.05445759892463684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,32,power_law_1.2,0.052748799324035645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,32,power_law_1.2,0.05368959903717041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,4,balanced,0.15413332978884378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,4,balanced,0.15499732891718546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,4,power_law_1.01,0.1429695963859558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,4,power_law_1.01,0.14652160406112671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,4,power_law_1.2,0.14366719722747803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,4,power_law_1.2,0.14744319915771484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,64,balanced,0.04391466577847799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,64,balanced,0.04573333263397217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,64,power_law_1.01,0.04426240026950836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,64,power_law_1.01,0.044627198576927186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,64,power_law_1.2,0.04410879909992218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,64,power_law_1.2,0.04426240026950836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,8,balanced,0.10103999574979146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,8,balanced,0.10249066352844238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,8,power_law_1.01,0.09841279983520508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,8,power_law_1.01,0.09992319941520691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,8,power_law_1.2,0.09671679735183716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,1,8,power_law_1.2,0.09902080297470092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,16,1,balanced,0.08773333827654521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,16,1,balanced,0.08859733740488689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,16,1,power_law_1.01,0.08294399976730346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,16,1,power_law_1.01,0.08407679796218873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,16,1,power_law_1.2,0.08370559811592101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,16,1,power_law_1.2,0.0837119996547699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,2,1,balanced,0.26393065849939984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,2,1,balanced,0.2655093272527059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,2,1,power_law_1.01,0.235481595993042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,2,1,power_law_1.01,0.2408128023147583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,2,1,power_law_1.2,0.24213759899139403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,2,1,power_law_1.2,0.24588160514831542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,32,1,balanced,0.0745600014925003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,32,1,balanced,0.07495466868082683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,32,1,power_law_1.01,0.06988800168037415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,32,1,power_law_1.01,0.07035520076751708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,32,1,power_law_1.2,0.07099519968032837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,32,1,power_law_1.2,0.07175679802894593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,4,1,balanced,0.16354133685429892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,4,1,balanced,0.176581343015035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,4,1,power_law_1.01,0.14988160133361816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,4,1,power_law_1.01,0.15018880367279053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,4,1,power_law_1.2,0.1502527952194214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,4,1,power_law_1.2,0.15086079835891725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,8,1,balanced,0.1172106663386027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,8,1,balanced,0.11773332953453064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,8,1,power_law_1.01,0.11013760566711425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,8,1,power_law_1.01,0.11088000535964966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,8,1,power_law_1.2,0.11021440029144287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,1536,8,128,8,1,power_law_1.2,0.11184639930725097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,1,balanced,3.1963094075520835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,1,balanced,3.3002293904622397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,1,power_law_1.01,2.4652736663818358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,1,power_law_1.01,2.5267839431762695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,1,power_law_1.2,2.426777648925781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,1,power_law_1.2,2.5770240783691407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,128,balanced,0.10354133447011311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,128,balanced,0.10359999537467957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,128,power_law_1.01,0.10117119550704956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,128,power_law_1.01,0.10280959606170655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,128,power_law_1.2,0.10096640586853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,128,power_law_1.2,0.10220799446105958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,16,balanced,0.2698506712913513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,16,balanced,0.2707359989484151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,16,power_law_1.01,0.2415679931640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,16,power_law_1.01,0.24751360416412355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,16,power_law_1.2,0.23649919033050537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,16,power_law_1.2,0.24763519763946534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,2,balanced,1.5339360237121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,2,balanced,1.5866719881693523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,2,power_law_1.01,1.2618111610412597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,2,power_law_1.01,1.281043243408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,2,power_law_1.2,1.3086079597473144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,2,power_law_1.2,1.337343978881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,256,balanced,0.08542933066685994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,256,balanced,0.09074667096138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,256,power_law_1.01,0.08750079870223999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,256,power_law_1.01,0.08854399919509888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,256,power_law_1.2,0.08587520122528076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,256,power_law_1.2,0.0862272024154663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,32,balanced,0.17726399501164755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,32,balanced,0.17896533012390137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,32,power_law_1.01,0.16488319635391235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,32,power_law_1.01,0.16917120218276976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,32,power_law_1.2,0.1675647974014282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,32,power_law_1.2,0.17069439888000487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,4,balanced,0.8076480229695638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,4,balanced,0.8087626298268636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,4,power_law_1.01,0.6992000102996826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,4,power_law_1.01,0.7326528072357178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,4,power_law_1.2,0.6971776008605957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,4,power_law_1.2,0.7207295894622803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,64,balanced,0.12944533427556357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,64,balanced,0.1297653317451477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,64,power_law_1.01,0.12417279481887818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,64,power_law_1.01,0.12616959810256959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,64,power_law_1.2,0.12121599912643433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,64,power_law_1.2,0.12499840259552002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,8,balanced,0.44760000705718994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,8,balanced,0.45018664995829266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,8,power_law_1.01,0.3854912042617798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,8,power_law_1.01,0.4048895835876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,8,power_law_1.2,0.410643196105957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,1,8,power_law_1.2,0.4293824195861816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,16,1,balanced,1.5909546216328938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,16,1,balanced,1.593450705210368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,16,1,power_law_1.01,1.3141504287719727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,16,1,power_law_1.01,1.324300765991211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,16,1,power_law_1.2,1.3015616416931153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,16,1,power_law_1.2,1.311366367340088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,2,1,balanced,1.571232000986735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,2,1,balanced,1.6472053527832031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,2,1,power_law_1.01,1.2883584022521972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,2,1,power_law_1.01,1.3116671562194824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,2,1,power_law_1.2,1.305561637878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,2,1,power_law_1.2,1.3093376159667969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,32,1,balanced,1.259930690129598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,32,1,balanced,1.2622826894124348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,32,1,power_law_1.01,1.0370176315307618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,32,1,power_law_1.01,1.051411247253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,32,1,power_law_1.2,1.0457599639892579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,32,1,power_law_1.2,1.0544192314147949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,4,1,balanced,0.8726507027943929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,4,1,balanced,0.8740800221761068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,4,1,power_law_1.01,0.7230912208557129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,4,1,power_law_1.01,0.7233856201171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,4,1,power_law_1.2,0.7113215923309326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,4,1,power_law_1.2,0.731001615524292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,8,1,balanced,0.5153973499933878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,8,1,balanced,0.5289119879404703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,8,1,power_law_1.01,0.42679681777954104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,8,1,power_law_1.01,0.431276798248291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,8,1,power_law_1.2,0.4304512023925781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,4096,2688,22,512,8,1,power_law_1.2,0.43114237785339354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,1,balanced,0.490506649017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,1,balanced,0.49582401911417645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,1,power_law_1.01,0.5472000122070313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,1,power_law_1.01,0.5472896099090576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,1,power_law_1.2,0.5432384014129639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,1,power_law_1.2,0.5568895816802979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,2,balanced,0.3080586592356364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,2,balanced,0.3157866597175598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,2,power_law_1.01,0.3322432041168213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,2,power_law_1.01,0.36160640716552733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,2,power_law_1.2,0.3502527952194214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,2,power_law_1.2,0.3505536079406738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,4,balanced,0.21313599745432535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,4,balanced,0.2185386617978414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,4,power_law_1.01,0.24092159271240235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,4,power_law_1.01,0.24116480350494385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,4,power_law_1.2,0.24261760711669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,4,power_law_1.2,0.25311999320983886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,8,balanced,0.16292267044385275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,8,balanced,0.16502933700879416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,8,power_law_1.01,0.1889855980873108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,8,power_law_1.01,0.18971519470214843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,8,power_law_1.2,0.18878719806671143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,1,8,power_law_1.2,0.18952959775924683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,16,1,balanced,0.07215466598669688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,16,1,balanced,0.07253333429495494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,16,1,power_law_1.01,0.074726402759552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,16,1,power_law_1.01,0.07507200241088867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,16,1,power_law_1.2,0.07268480062484742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,16,1,power_law_1.2,0.07354239821434021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,2,1,balanced,0.27007466554641724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,2,1,balanced,0.2797653277715047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,2,1,power_law_1.01,0.27930240631103515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,2,1,power_law_1.01,0.28405759334564207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,2,1,power_law_1.2,0.27952640056610106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,2,1,power_law_1.2,0.2933056116104126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,32,1,balanced,0.044218664367993675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,32,1,balanced,0.05067733426888784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,32,1,power_law_1.01,0.052697598934173584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,32,1,power_law_1.01,0.05429120063781738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,32,1,power_law_1.2,0.053830397129058835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,32,1,power_law_1.2,0.054041600227355956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,4,1,balanced,0.1611786683400472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,4,1,balanced,0.2007253368695577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,4,1,power_law_1.01,0.16703360080718993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,4,1,power_law_1.01,0.1674239993095398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,4,1,power_law_1.2,0.16480640172958375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,4,1,power_law_1.2,0.17993600368499757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,8,1,balanced,0.11552000045776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,8,1,balanced,0.12504000465075174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,8,1,power_law_1.01,0.10421119928359986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,8,1,power_law_1.01,0.10450559854507446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,8,1,power_law_1.2,0.10460159778594971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,16384,2,8,8,1,power_law_1.2,0.10665600299835205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,1,balanced,1.737610658009847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,1,balanced,1.8237066268920898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,1,power_law_1.01,1.3039487838745116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,1,power_law_1.01,1.306060791015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,1,power_law_1.2,1.303212833404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,1,power_law_1.2,1.3210559844970704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,128,balanced,0.07035199801127116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,128,balanced,0.07066666583220164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,128,power_law_1.01,0.06925439834594727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,128,power_law_1.01,0.069651198387146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,128,power_law_1.2,0.06958079934120179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,128,power_law_1.2,0.07089279890060425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,16,balanced,0.17087467511494955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,16,balanced,0.17181867361068726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,16,power_law_1.01,0.15441919565200807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,16,power_law_1.01,0.15827840566635132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,16,power_law_1.2,0.1510655999183655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,16,power_law_1.2,0.15404800176620484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,2,balanced,0.8989386558532715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,2,balanced,0.9061226844787598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,2,power_law_1.01,0.6636223793029785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,2,power_law_1.01,0.6899392127990722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,2,power_law_1.2,0.6674304008483887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,2,power_law_1.2,0.6959360122680665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,256,balanced,0.058101331194241844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,256,balanced,0.058117335041364036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,256,power_law_1.01,0.056441599130630495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,256,power_law_1.01,0.056953597068786624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,256,power_law_1.2,0.056441599130630495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,256,power_law_1.2,0.056953597068786624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,32,balanced,0.11758933464686076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,32,balanced,0.11776533722877502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,32,power_law_1.01,0.11146880388259887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,32,power_law_1.01,0.11371519565582275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,32,power_law_1.2,0.1001471996307373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,32,power_law_1.2,0.10735360383987427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,4,balanced,0.4775306781133016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,4,balanced,0.48578135172526044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,4,power_law_1.01,0.3921216011047363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,4,power_law_1.01,0.42699518203735354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,4,power_law_1.2,0.3467711925506592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,4,power_law_1.2,0.42697601318359374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,64,balanced,0.08932266632715861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,64,balanced,0.0909546713034312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,64,power_law_1.01,0.08559359908103943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,64,power_law_1.01,0.08664320111274719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,64,power_law_1.2,0.08563200235366822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,64,power_law_1.2,0.08604159951210022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,8,balanced,0.2720693349838257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,8,balanced,0.2736533284187317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,8,power_law_1.01,0.23393919467926025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,8,power_law_1.01,0.2395711898803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,8,power_law_1.2,0.22001919746398926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,1,8,power_law_1.2,0.23720960617065429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,16,1,balanced,0.2160586714744568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,16,1,balanced,0.21619200706481934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,16,1,power_law_1.01,0.16707839965820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,16,1,power_law_1.01,0.16832640171051025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,16,1,power_law_1.2,0.16500480175018312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,16,1,power_law_1.2,0.1657663941383362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,2,1,balanced,0.9198666413625082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,2,1,balanced,0.9216907024383545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,2,1,power_law_1.01,0.7022592067718506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,2,1,power_law_1.01,0.7030911922454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,2,1,power_law_1.2,0.6936575889587402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,2,1,power_law_1.2,0.6946176052093506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,32,1,balanced,0.17328532536824545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,32,1,balanced,0.17357333501180014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,32,1,power_law_1.01,0.14083839654922486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,32,1,power_law_1.01,0.14279680252075194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,32,1,power_law_1.2,0.14143999814987182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,32,1,power_law_1.2,0.14145920276641846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,4,1,balanced,0.5101120074590048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,4,1,balanced,0.510757327079773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,4,1,power_law_1.01,0.3971263885498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,4,1,power_law_1.01,0.4035647869110107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,4,1,power_law_1.2,0.3880896091461182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,4,1,power_law_1.2,0.3968192100524902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,8,1,balanced,0.31380265951156616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,8,1,balanced,0.3146986762682597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,8,1,power_law_1.01,0.24078080654144288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,8,1,power_law_1.01,0.24120960235595704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,8,1,power_law_1.2,0.24296960830688477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2048,8,256,8,1,power_law_1.2,0.24372479915618897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,1,balanced,1.3838507334391277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,1,balanced,1.4545493125915527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,1,power_law_1.01,1.141823959350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,1,power_law_1.01,1.173151969909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,1,power_law_1.2,1.148147201538086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,1,power_law_1.2,1.205241584777832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,16,balanced,0.13843199610710144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,16,balanced,0.1414400041103363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,16,power_law_1.01,0.12935680150985718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,16,power_law_1.01,0.1335935950279236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,16,power_law_1.2,0.13367040157318116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,16,power_law_1.2,0.13419519662857055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,2,balanced,0.7091626326243082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,2,balanced,0.7132906913757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,2,power_law_1.01,0.6249472141265869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,2,power_law_1.01,0.6563263893127441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,2,power_law_1.2,0.5970751762390136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,2,power_law_1.2,0.6243648052215576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,32,balanced,0.09923733274141948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,32,balanced,0.09941333532333374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,32,power_law_1.01,0.09612799882888794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,32,power_law_1.01,0.09786880016326904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,32,power_law_1.2,0.09482240080833435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,32,power_law_1.2,0.09587200284004212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,4,balanced,0.3805066744486491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,4,balanced,0.3945759932200114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,4,power_law_1.01,0.3410752058029175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,4,power_law_1.01,0.3566848039627075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,4,power_law_1.2,0.3304768085479736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,4,power_law_1.2,0.34540159702301027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,8,balanced,0.2182933290799459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,8,balanced,0.21836266915003458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,8,power_law_1.01,0.2017280101776123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,8,power_law_1.01,0.2091775894165039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,8,power_law_1.2,0.20183680057525635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,1,8,power_law_1.2,0.20478720664978028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,16,1,balanced,0.17568532625834146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,16,1,balanced,0.17706666390101114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,16,1,power_law_1.01,0.15601279735565185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,16,1,power_law_1.01,0.1614400029182434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,16,1,power_law_1.2,0.15768959522247314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,16,1,power_law_1.2,0.16171519756317138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,2,1,balanced,0.7215147018432617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,2,1,balanced,0.7221333185831705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,2,1,power_law_1.01,0.611027193069458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,2,1,power_law_1.01,0.6138879776000976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,2,1,power_law_1.2,0.6111487865447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,2,1,power_law_1.2,0.6288576126098633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,32,1,balanced,0.1366933286190033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,32,1,balanced,0.13693867127100626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,32,1,power_law_1.01,0.12243839502334594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,32,1,power_law_1.01,0.12473599910736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,32,1,power_law_1.2,0.12206079959869384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,32,1,power_law_1.2,0.1247871994972229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,4,1,balanced,0.4004640181859334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,4,1,balanced,0.40060798327128094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,4,1,power_law_1.01,0.3467200040817261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,4,1,power_law_1.01,0.3525439977645874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,4,1,power_law_1.2,0.3478271961212158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,4,1,power_law_1.2,0.35256319046020507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,8,1,balanced,0.2505706747372945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,8,1,balanced,0.2528266708056132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,8,1,power_law_1.01,0.22088320255279542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,8,1,power_law_1.01,0.2252351999282837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,8,1,power_law_1.2,0.2219520092010498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,6144,2560,8,160,8,1,power_law_1.2,0.22400639057159424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,1,balanced,2.014224052429199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,1,balanced,2.0164106686909995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,1,power_law_1.01,1.515129566192627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,1,power_law_1.01,1.5612735748291016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,1,power_law_1.2,1.5090815544128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,1,power_law_1.2,1.5105024337768556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,128,balanced,0.08122666676839192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,128,balanced,0.08377599716186523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,128,power_law_1.01,0.07946879863739013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,128,power_law_1.01,0.08030719757080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,128,power_law_1.2,0.08138239979743958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,128,power_law_1.2,0.08157439827919007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,16,balanced,0.19472533464431763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,16,balanced,0.19498133659362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,16,power_law_1.01,0.15877120494842528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,16,power_law_1.01,0.1834879994392395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,16,power_law_1.2,0.1669376015663147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,16,power_law_1.2,0.17123199701309205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,2,balanced,1.0398080348968506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,2,balanced,1.0402613480885823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,2,power_law_1.01,0.8431808471679687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,2,power_law_1.01,0.851750373840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,2,power_law_1.2,0.8013119697570801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,2,power_law_1.2,0.8103679656982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,256,balanced,0.0643146683772405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,256,balanced,0.06634133557478587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,256,power_law_1.01,0.06412799954414368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,256,power_law_1.01,0.06499199867248535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,256,power_law_1.2,0.062067198753356936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,256,power_law_1.2,0.0655232012271881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,32,balanced,0.1322879989941915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,32,balanced,0.13362133502960205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,32,power_law_1.01,0.11979520320892334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,32,power_law_1.01,0.12463999986648559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,32,power_law_1.2,0.11883519887924195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,32,power_law_1.2,0.12453759908676147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,4,balanced,0.5598346789677938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,4,balanced,0.6273333231608073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,4,power_law_1.01,0.44472317695617675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,4,power_law_1.01,0.47673602104187013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,4,power_law_1.2,0.46184959411621096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,4,power_law_1.2,0.4895296096801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,64,balanced,0.10020800431569417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,64,balanced,0.10133333007494609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,64,power_law_1.01,0.09488000273704529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,64,power_law_1.01,0.09646720290184022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,64,power_law_1.2,0.09256319999694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,64,power_law_1.2,0.09686400294303894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,8,balanced,0.3145973285039266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,8,balanced,0.31863999366760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,8,power_law_1.01,0.25280640125274656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,8,power_law_1.01,0.2646656036376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,8,power_law_1.2,0.2702847957611084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,1,8,power_law_1.2,0.2805824041366577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,16,1,balanced,0.2462559938430786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,16,1,balanced,0.24692267179489136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,16,1,power_law_1.01,0.19088000059127808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,16,1,power_law_1.01,0.1928063988685608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,16,1,power_law_1.2,0.18983039855957032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,16,1,power_law_1.2,0.1906048059463501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,2,1,balanced,1.065882682800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,2,1,balanced,1.0664479732513428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,2,1,power_law_1.01,0.8085887908935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,2,1,power_law_1.01,0.8150848388671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,2,1,power_law_1.2,0.7899136066436767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,2,1,power_law_1.2,0.8151488304138184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,32,1,balanced,0.19582400719324747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,32,1,balanced,0.1967839996019999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,32,1,power_law_1.01,0.16135040521621705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,32,1,power_law_1.01,0.16481280326843262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,32,1,power_law_1.2,0.15930880308151246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,32,1,power_law_1.2,0.16125439405441283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,4,1,balanced,0.5901333491007487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,4,1,balanced,0.5954773426055908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,4,1,power_law_1.01,0.4583871841430664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,4,1,power_law_1.01,0.46010241508483884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,4,1,power_law_1.2,0.45427842140197755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,4,1,power_law_1.2,0.4546624183654785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,8,1,balanced,0.3622080087661743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,8,1,balanced,0.3708639939626058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,8,1,power_law_1.01,0.27869439125061035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,8,1,power_law_1.01,0.2813375949859619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,8,1,power_law_1.2,0.27263360023498534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,256,8,1,power_law_1.2,0.2778048038482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,1,balanced,3.112016042073568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,1,balanced,3.322554588317871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,1,power_law_1.01,2.0164031982421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,1,power_law_1.01,2.1301631927490234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,1,power_law_1.2,1.9235904693603516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,1,power_law_1.2,1.959097671508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,128,balanced,0.09734933574994405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,128,balanced,0.09788800279299419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,128,power_law_1.01,0.09573119878768921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,128,power_law_1.01,0.09631999731063842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,128,power_law_1.2,0.09456639885902404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,128,power_law_1.2,0.09573760032653808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,16,balanced,0.25410666068394977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,16,balanced,0.25566933552424115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,16,power_law_1.01,0.23651199340820311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,16,power_law_1.01,0.24842240810394287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,16,power_law_1.2,0.23255040645599365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,16,power_law_1.2,0.24172160625457764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,2,balanced,1.5318934122721355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,2,balanced,1.5344692866007488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,2,power_law_1.01,1.0773056030273438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,2,power_law_1.01,1.117407989501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,2,power_law_1.2,1.0683456420898438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,2,power_law_1.2,1.1011455535888672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,32,balanced,0.16340266664822897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,32,balanced,0.16404267152150473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,32,power_law_1.01,0.14965120553970337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,32,power_law_1.01,0.15569280385971068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,32,power_law_1.2,0.14797439575195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,32,power_law_1.2,0.1606528043746948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,4,balanced,0.801962693532308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,4,balanced,0.80348801612854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,4,power_law_1.01,0.6799488067626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,4,power_law_1.01,0.7130047798156738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,4,power_law_1.2,0.6716544151306152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,4,power_law_1.2,0.7065279960632325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,64,balanced,0.12147200107574463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,64,balanced,0.12230400244394939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,64,power_law_1.01,0.11466879844665527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,64,power_law_1.01,0.11559040546417236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,64,power_law_1.2,0.11044479608535766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,64,power_law_1.2,0.11808639764785767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,8,balanced,0.4349653323491414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,8,balanced,0.43776532014211017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,8,power_law_1.01,0.41296000480651857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,8,power_law_1.01,0.41680002212524414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,8,power_law_1.2,0.3608448028564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,1,8,power_law_1.2,0.4272319793701172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,16,1,balanced,0.3354133367538452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,16,1,balanced,0.33581864833831787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,16,1,power_law_1.01,0.250982403755188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,16,1,power_law_1.01,0.2560447931289673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,16,1,power_law_1.2,0.24222080707550048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,16,1,power_law_1.2,0.24451839923858643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,2,1,balanced,1.5714133580525715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,2,1,balanced,1.58787202835083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,2,1,power_law_1.01,1.0645312309265136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,2,1,power_law_1.01,1.0658432006835938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,2,1,power_law_1.2,1.0157695770263673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,2,1,power_law_1.2,1.0324288368225099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,32,1,balanced,0.27357866366704303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,32,1,balanced,0.27552000681559247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,32,1,power_law_1.01,0.20420479774475098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,32,1,power_law_1.01,0.20752639770507814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,32,1,power_law_1.2,0.19786880016326905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,32,1,power_law_1.2,0.19849599599838258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,4,1,balanced,0.863152027130127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,4,1,balanced,0.8641226291656494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,4,1,power_law_1.01,0.5952127933502197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,4,1,power_law_1.01,0.5980991840362548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,4,1,power_law_1.2,0.5836415767669678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,4,1,power_law_1.2,0.5843071937561035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,8,1,balanced,0.5081439812978109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,8,1,balanced,0.5107200145721436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,8,1,power_law_1.01,0.36217598915100097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,8,1,power_law_1.01,0.36408960819244385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,8,1,power_law_1.2,0.35019519329071047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,64,7168,2048,8,384,8,1,power_law_1.2,0.35260159969329835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,1,balanced,0.20441067218780518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,1,balanced,0.20547733704249063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,1,power_law_1.01,0.2097856044769287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,1,power_law_1.01,0.21094400882720948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,1,power_law_1.2,0.21927039623260497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,1,power_law_1.2,0.21971840858459474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,128,balanced,0.0764160007238388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,128,balanced,0.07662400106589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,128,power_law_1.01,0.07648640275001525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,128,power_law_1.01,0.07717120051383972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,128,power_law_1.2,0.0769599974155426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,128,power_law_1.2,0.07798399925231933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,16,balanced,0.08262933293978374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,16,balanced,0.084389328956604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,16,power_law_1.01,0.08802559971809387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,16,power_law_1.01,0.08977280259132385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,16,power_law_1.2,0.08787199854850769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,16,power_law_1.2,0.09014400243759155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,2,balanced,0.14751467108726501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,2,balanced,0.14754133423169455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,2,power_law_1.01,0.15652480125427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,2,power_law_1.01,0.15783679485321045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,2,power_law_1.2,0.15928959846496582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,2,power_law_1.2,0.16000640392303467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,32,balanced,0.07869333525498708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,32,balanced,0.08042133351167043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,32,power_law_1.01,0.08013439774513245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,32,power_law_1.01,0.08015360236167908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,32,power_law_1.2,0.08131840229034423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,32,power_law_1.2,0.0818560004234314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,4,balanced,0.11549866199493408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,4,balanced,0.11673067013422649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,4,power_law_1.01,0.11817599534988403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,4,power_law_1.01,0.12028160095214843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,4,power_law_1.2,0.12007679939270019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,4,power_law_1.2,0.12087039947509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,64,balanced,0.07705066601435344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,64,balanced,0.07865066826343536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,64,power_law_1.01,0.07727360129356384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,64,power_law_1.01,0.077292799949646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,64,power_law_1.2,0.07932159900665284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,64,power_law_1.2,0.07982720136642456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,8,balanced,0.09641066193580627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,8,balanced,0.09704533219337463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,8,power_law_1.01,0.09994879961013795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,8,power_law_1.01,0.10038399696350098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,8,power_law_1.2,0.10179840326309204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,1,8,power_law_1.2,0.10317440032958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,2,1,balanced,0.14028799533843994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,2,1,balanced,0.14040533701578775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,2,1,power_law_1.01,0.1428287982940674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,2,1,power_law_1.01,0.14635519981384276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,2,1,power_law_1.2,0.1540992021560669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,2,1,power_law_1.2,0.15446399450302123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,4,1,balanced,0.11545067032178243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,4,1,balanced,0.11752532919247945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,4,1,power_law_1.01,0.11880960464477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,4,1,power_law_1.01,0.11938560009002686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,4,1,power_law_1.2,0.12156800031661988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2048,768,8,128,4,1,power_law_1.2,0.12250239849090576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,1,balanced,0.45820267995198566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,1,balanced,0.4601866801579793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,1,power_law_1.01,0.4608767986297607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,1,power_law_1.01,0.46274561882019044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,1,power_law_1.2,0.4739583969116211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,1,power_law_1.2,0.47715201377868655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,128,balanced,0.10521599650382996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,128,balanced,0.10670933127403259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,128,power_law_1.01,0.10721919536590577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,128,power_law_1.01,0.10732799768447876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,128,power_law_1.2,0.10830719470977783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,128,power_law_1.2,0.11052160263061524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,16,balanced,0.12967466314633688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,16,balanced,0.1299199958642324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,16,power_law_1.01,0.13395839929580688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,16,power_law_1.01,0.1351744055747986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,16,power_law_1.2,0.1356608033180237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,16,power_law_1.2,0.1371392011642456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,2,balanced,0.293013334274292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,2,balanced,0.2931893269220988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,2,power_law_1.01,0.2942080020904541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,2,power_law_1.01,0.297107195854187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,2,power_law_1.2,0.30159358978271483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,2,power_law_1.2,0.306329607963562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,32,balanced,0.11506133278210957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,32,balanced,0.11709866921106975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,32,power_law_1.01,0.11940480470657348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,32,power_law_1.01,0.11942399740219116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,32,power_law_1.2,0.11943680047988892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,32,power_law_1.2,0.12252800464630127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,4,balanced,0.20583999156951904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,4,balanced,0.20587732394536337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,4,power_law_1.01,0.20599040985107422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,4,power_law_1.01,0.20835840702056885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,4,power_law_1.2,0.21329920291900634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,4,power_law_1.2,0.21504640579223633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,64,balanced,0.10942932963371277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,64,balanced,0.11030933260917664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,64,power_law_1.01,0.11219840049743653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,64,power_law_1.01,0.11291520595550537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,64,power_law_1.2,0.11268479824066162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,64,power_law_1.2,0.11455999612808228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,8,balanced,0.1563093364238739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,8,balanced,0.15636799732844034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,8,power_law_1.01,0.16083840131759644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,8,power_law_1.01,0.16266239881515504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,8,power_law_1.2,0.16432000398635865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,1,8,power_law_1.2,0.16455039978027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,16,1,balanced,0.7826186815897623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,16,1,balanced,0.7860906918843588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,16,1,power_law_1.01,0.7965504169464112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,16,1,power_law_1.01,0.7977151870727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,16,1,power_law_1.2,0.8456895828247071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,16,1,power_law_1.2,0.8499263763427735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,2,1,balanced,0.27937066555023193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,2,1,balanced,0.27962666749954224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,2,1,power_law_1.01,0.28022398948669436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,2,1,power_law_1.01,0.2830143928527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,2,1,power_law_1.2,0.28752000331878663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,2,1,power_law_1.2,0.2899712085723877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,32,1,balanced,0.6747626463572184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,32,1,balanced,0.6761706670125326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,32,1,power_law_1.01,0.6899072170257569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,32,1,power_law_1.01,0.7005695819854736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,32,1,power_law_1.2,0.7143231868743897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,32,1,power_law_1.2,0.7350848197937012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,4,1,balanced,0.18888533115386963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,4,1,balanced,0.18997333447138467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,4,1,power_law_1.01,0.18913919925689698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,4,1,power_law_1.01,0.18961280584335327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,4,1,power_law_1.2,0.1929471969604492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,4,1,power_law_1.2,0.19410560131072999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,8,1,balanced,1.0669546922047932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,8,1,balanced,1.1057120164235432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,8,1,power_law_1.01,1.095622444152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,8,1,power_law_1.01,1.1438015937805175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,8,1,power_law_1.2,1.1589887619018555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,2688,1856,6,128,8,1,power_law_1.2,1.1658368110656738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,1,balanced,0.7810719807942709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,1,balanced,0.7819999853769938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,1,power_law_1.01,0.730841588973999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,1,power_law_1.01,0.7310656070709228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,1,power_law_1.2,0.7639039993286133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,1,power_law_1.2,0.7738624095916748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,128,balanced,0.14627200365066528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,128,balanced,0.14783466855684915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,128,power_law_1.01,0.14731520414352417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,128,power_law_1.01,0.14736000299453736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,128,power_law_1.2,0.1481152057647705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,128,power_law_1.2,0.14870400428771974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,16,balanced,0.19129600127538046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,16,balanced,0.19171732664108276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,16,power_law_1.01,0.18910080194473267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,16,power_law_1.01,0.1899839997291565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,16,power_law_1.2,0.19434239864349365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,16,power_law_1.2,0.1943935990333557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,2,balanced,0.4800106684366862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,2,balanced,0.4809226592381795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,2,power_law_1.01,0.4533247947692871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,2,power_law_1.01,0.464243221282959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,2,power_law_1.2,0.469542407989502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,2,power_law_1.2,0.47192959785461425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,256,balanced,0.14427199959754944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,256,balanced,0.1462613344192505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,256,power_law_1.01,0.14562560319900514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,256,power_law_1.01,0.14569599628448487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,256,power_law_1.2,0.14503040313720703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,256,power_law_1.2,0.1452288031578064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,32,balanced,0.1651573379834493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,32,balanced,0.1662826637427012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,32,power_law_1.01,0.16482559442520142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,32,power_law_1.01,0.16858240365982055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,32,power_law_1.2,0.168723201751709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,32,power_law_1.2,0.16967040300369263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,4,balanced,0.3216906587282817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,4,balanced,0.3218773404757182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,4,power_law_1.01,0.30684800148010255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,4,power_law_1.01,0.30833280086517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,4,power_law_1.2,0.3157504081726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,4,power_law_1.2,0.3225023984909058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,64,balanced,0.151119997104009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,64,balanced,0.1520960032939911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,64,power_law_1.01,0.15011199712753295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,64,power_law_1.01,0.15202560424804687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,64,power_law_1.2,0.15374720096588135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,64,power_law_1.2,0.15555839538574218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,8,balanced,0.23490132888158163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,8,balanced,0.23578667640686035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,8,power_law_1.01,0.23130879402160645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,8,power_law_1.01,0.23171839714050294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,8,power_law_1.2,0.23463039398193358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,1,8,power_law_1.2,0.234771203994751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,16,1,balanced,0.1943839987119039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,16,1,balanced,0.19554666678110758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,16,1,power_law_1.01,0.18755840063095092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,16,1,power_law_1.01,0.18888319730758668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,16,1,power_law_1.2,0.1926911950111389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,16,1,power_law_1.2,0.19304959774017333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,2,1,balanced,0.46439464886983234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,2,1,balanced,0.46538134415944415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,2,1,power_law_1.01,0.4332736015319824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,2,1,power_law_1.01,0.437286376953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,2,1,power_law_1.2,0.4556863784790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,2,1,power_law_1.2,0.4577023983001709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,32,1,balanced,0.1729066570599874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,32,1,balanced,0.1729546586672465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,32,1,power_law_1.01,0.16705280542373657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,32,1,power_law_1.01,0.16876159906387328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,32,1,power_law_1.2,0.17311999797821045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,32,1,power_law_1.2,0.17408000230789183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,4,1,balanced,0.3071039915084839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,4,1,balanced,0.3081546624501546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,4,1,power_law_1.01,0.28665599822998045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,4,1,power_law_1.01,0.288371205329895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,4,1,power_law_1.2,0.30236799716949464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,4,1,power_law_1.2,0.3030463933944702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,8,1,balanced,0.2326186696688334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,8,1,balanced,0.23429334163665771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,8,1,power_law_1.01,0.2250368118286133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,8,1,power_law_1.01,0.22566399574279786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,8,1,power_law_1.2,0.23225600719451905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,3072,1536,8,256,8,1,power_law_1.2,0.23226239681243896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,1,balanced,0.5724266767501831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,1,balanced,0.5749599933624268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,1,power_law_1.01,0.5847487926483155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,1,power_law_1.01,0.601632022857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,1,power_law_1.2,0.584716796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,1,power_law_1.2,0.5900224208831787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,2,balanced,0.32891732454299927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,2,balanced,0.32893866300582886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,2,power_law_1.01,0.4063680171966553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,2,power_law_1.01,0.41631360054016114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,2,power_law_1.2,0.34213759899139407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,2,power_law_1.2,0.40838398933410647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,4,balanced,0.25752000013987225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,4,balanced,0.25900799036026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,4,power_law_1.01,0.2792896032333374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,4,power_law_1.01,0.3030783891677856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,4,power_law_1.2,0.29999361038208006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,4,power_law_1.2,0.30556159019470214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,8,balanced,0.22323199113210043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,8,balanced,0.22456000248591104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,8,power_law_1.01,0.2696063995361328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,8,power_law_1.01,0.27100160121917727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,8,power_law_1.2,0.26632959842681886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,1,8,power_law_1.2,0.27413120269775393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,16,1,balanced,0.07653333246707916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,16,1,balanced,0.07773333291212718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,16,1,power_law_1.01,0.0756991982460022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,16,1,power_law_1.01,0.07622399926185608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,16,1,power_law_1.2,0.07618560194969178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,16,1,power_law_1.2,0.07703040242195129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,2,1,balanced,0.30109333992004395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,2,1,balanced,0.30110400915145874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,2,1,power_law_1.01,0.2989887952804565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,2,1,power_law_1.01,0.29944961071014403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,2,1,power_law_1.2,0.29616000652313235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,2,1,power_law_1.2,0.2984447956085205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,32,1,balanced,0.06216000020503998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,32,1,balanced,0.06401599943637848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,32,1,power_law_1.01,0.063372802734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,32,1,power_law_1.01,0.06439039707183838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,32,1,power_law_1.2,0.06485120058059693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,32,1,power_law_1.2,0.06505600214004517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,4,1,balanced,0.1732106606165568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,4,1,balanced,0.17510932683944702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,4,1,power_law_1.01,0.17045120000839234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,4,1,power_law_1.01,0.17581440210342408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,4,1,power_law_1.2,0.171942400932312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,4,1,power_law_1.2,0.17317119836807252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,8,1,balanced,0.1092693308989207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,8,1,balanced,0.10938666264216106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,8,1,power_law_1.01,0.10867840051651001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,8,1,power_law_1.01,0.10998400449752807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,8,1,power_law_1.2,0.11079679727554322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,14336,2,8,8,1,power_law_1.2,0.11125760078430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,1,balanced,0.5557599862416586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,1,balanced,0.5571680068969727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,1,power_law_1.01,0.5765056133270263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,1,power_law_1.01,0.5850495815277099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,1,power_law_1.2,0.5953919887542725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,1,power_law_1.2,0.6010687828063965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,128,balanced,0.1295253336429596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,128,balanced,0.1297706663608551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,128,power_law_1.01,0.1306496024131775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,128,power_law_1.01,0.13320959806442262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,128,power_law_1.2,0.13370239734649658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,128,power_law_1.2,0.1348736047744751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,16,balanced,0.15465066830317178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,16,balanced,0.15636266271273294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,16,power_law_1.01,0.16705280542373657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,16,power_law_1.01,0.16949119567871093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,16,power_law_1.2,0.16869759559631348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,16,power_law_1.2,0.1737023949623108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,2,balanced,0.35500800609588623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,2,balanced,0.35502398014068604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,2,power_law_1.01,0.370195198059082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,2,power_law_1.01,0.38075520992279055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,2,power_law_1.2,0.37727999687194824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,2,power_law_1.2,0.3831935882568359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,32,balanced,0.13900799552599588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,32,balanced,0.13904533783594766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,32,power_law_1.01,0.14466559886932373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,32,power_law_1.01,0.1472383975982666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,32,power_law_1.2,0.14940160512924194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,32,power_law_1.2,0.15143680572509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,4,balanced,0.24451732635498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,4,balanced,0.2453333338101705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,4,power_law_1.01,0.25975680351257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,4,power_law_1.01,0.2606208086013794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,4,power_law_1.2,0.26328320503234864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,4,power_law_1.2,0.2634495973587036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,64,balanced,0.13119999567667642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,64,balanced,0.13214932878812155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,64,power_law_1.01,0.13674880266189576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,64,power_law_1.01,0.13772159814834595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,64,power_law_1.2,0.13845759630203247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,64,power_law_1.2,0.13923840522766112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,8,balanced,0.1891253391901652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,8,balanced,0.18962132930755615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,8,power_law_1.01,0.19576319456100463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,8,power_law_1.01,0.19909119606018066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,8,power_law_1.2,0.2016319990158081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,1,8,power_law_1.2,0.20277760028839112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,16,1,balanced,0.1544533371925354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,16,1,balanced,0.15478932857513428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,16,1,power_law_1.01,0.16021759510040284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,16,1,power_law_1.01,0.1642303943634033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,16,1,power_law_1.2,0.1776128053665161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,16,1,power_law_1.2,0.17799680233001708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,2,1,balanced,0.34304531415303546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,2,1,balanced,0.34479467074076336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,2,1,power_law_1.01,0.35530240535736085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,2,1,power_law_1.01,0.3562943935394287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,2,1,power_law_1.2,0.36615040302276614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,2,1,power_law_1.2,0.3669503927230835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,32,1,balanced,0.14638400077819824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,32,1,balanced,0.1481706698735555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,32,1,power_law_1.01,0.15348479747772217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,32,1,power_law_1.01,0.15407999753952026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,32,1,power_law_1.2,0.15510400533676147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,32,1,power_law_1.2,0.15714559555053711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,4,1,balanced,0.2318506638209025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,4,1,balanced,0.23363200823465982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,4,1,power_law_1.01,0.23651840686798095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,4,1,power_law_1.01,0.24062080383300782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,4,1,power_law_1.2,0.2541887998580933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,4,1,power_law_1.2,0.2543423891067505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,8,1,balanced,0.1886026660601298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,8,1,balanced,0.18939733505249023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,8,1,power_law_1.01,0.19568639993667603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,8,1,power_law_1.01,0.19706239700317382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,8,1,power_law_1.2,0.19812480211257935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,1536,8,128,8,1,power_law_1.2,0.19893120527267455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,1,balanced,3.316549301147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,1,balanced,3.32637882232666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,1,power_law_1.01,3.286707305908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,1,power_law_1.01,3.414585494995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,1,power_law_1.2,3.39312629699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,1,power_law_1.2,3.70709114074707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,128,balanced,0.48309866587320965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,128,balanced,0.483733336130778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,128,power_law_1.01,0.49103360176086425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,128,power_law_1.01,0.49190402030944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,128,power_law_1.2,0.4933504104614258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,128,power_law_1.2,0.4979263782501221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,16,balanced,0.6540266672770182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,16,balanced,0.655077338218689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,16,power_law_1.01,0.6598464012145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,16,power_law_1.01,0.6607808113098145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,16,power_law_1.2,0.6645055770874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,16,power_law_1.2,0.679475212097168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,2,balanced,1.9332000414530437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,2,balanced,1.9564213752746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,2,power_law_1.01,1.9130624771118163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,2,power_law_1.01,1.918604850769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,2,power_law_1.2,1.9869056701660157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,2,power_law_1.2,2.0130943298339843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,256,balanced,0.4740639925003052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,256,balanced,0.4742026726404826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,256,power_law_1.01,0.47863039970397947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,256,power_law_1.01,0.4796031951904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,256,power_law_1.2,0.4807231903076172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,256,power_law_1.2,0.48316159248352053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,32,balanced,0.5573013226191202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,32,balanced,0.5612320105234782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,32,power_law_1.01,0.5639808177947998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,32,power_law_1.01,0.5646912097930908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,32,power_law_1.2,0.5795904159545898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,32,power_law_1.2,0.580294418334961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,4,balanced,1.1990559895833333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,4,balanced,1.2005066871643066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,4,power_law_1.01,1.1986111640930175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,4,power_law_1.01,1.2060159683227538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,4,power_law_1.2,1.2214271545410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,4,power_law_1.2,1.245574378967285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,64,balanced,0.5130933523178101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,64,balanced,0.5141119956970215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,64,power_law_1.01,0.5179776191711426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,64,power_law_1.01,0.5204480171203614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,64,power_law_1.2,0.5200128078460693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,64,power_law_1.2,0.526316785812378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,8,balanced,0.8399626413981119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,8,balanced,0.8424692948659261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,8,power_law_1.01,0.8473407745361328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,8,power_law_1.01,0.8524607658386231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,8,power_law_1.2,0.8544832229614258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,1,8,power_law_1.2,0.8793408393859863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,16,1,balanced,5.7422027587890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,16,1,balanced,6.126101175944011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,16,1,power_law_1.01,6.16297607421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,16,1,power_law_1.01,6.2948158264160154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,16,1,power_law_1.2,6.389452743530273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,16,1,power_law_1.2,6.5384063720703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,2,1,balanced,1.8064319292704265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,2,1,balanced,1.9020479520161946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,2,1,power_law_1.01,1.8143552780151366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,2,1,power_law_1.01,1.8216127395629882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,2,1,power_law_1.2,1.8602048873901367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,2,1,power_law_1.2,1.8691007614135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,32,1,balanced,3.9985119501749673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,32,1,balanced,4.04585615793864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,32,1,power_law_1.01,4.111487960815429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,32,1,power_law_1.01,4.123270416259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,32,1,power_law_1.2,4.275225448608398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,32,1,power_law_1.2,4.349990463256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,4,1,balanced,1.0980693499247234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,4,1,balanced,1.101637363433838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,4,1,power_law_1.01,1.104147243499756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,4,1,power_law_1.01,1.1082304000854493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,4,1,power_law_1.2,1.138047981262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,4,1,power_law_1.2,1.147366428375244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,8,1,balanced,0.7403093179066976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,8,1,balanced,0.7405280272165934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,8,1,power_law_1.01,0.7383488178253174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,8,1,power_law_1.01,0.7417664051055908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,8,1,power_law_1.2,0.7644544124603272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,4096,2688,22,512,8,1,power_law_1.2,0.7738368034362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,1,balanced,0.9295146465301514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,1,balanced,0.9341546694437662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,1,power_law_1.01,0.9462400436401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,1,power_law_1.01,0.978335952758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,1,power_law_1.2,0.9686143875122071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,1,power_law_1.2,0.9952832221984863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,2,balanced,0.5129973491032919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,2,balanced,0.521232008934021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,2,power_law_1.01,0.5708928108215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,2,power_law_1.01,0.5970240116119385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,2,power_law_1.2,0.5680255889892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,2,power_law_1.2,0.6143167972564697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,4,balanced,0.3290506601333618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,4,balanced,0.3338666756947835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,4,power_law_1.01,0.4286464214324951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,4,power_law_1.01,0.4418752193450928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,4,power_law_1.2,0.4507455825805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,4,power_law_1.2,0.4525887966156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,8,balanced,0.2753653327624003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,8,balanced,0.28068800767262775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,8,power_law_1.01,0.3337088108062744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,8,power_law_1.01,0.34796159267425536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,8,power_law_1.2,0.3377984046936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,1,8,power_law_1.2,0.34744958877563475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,16,1,balanced,0.1032373309135437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,16,1,balanced,0.10390399893124898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,16,1,power_law_1.01,0.10293760299682617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,16,1,power_law_1.01,0.10386559963226319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,16,1,power_law_1.2,0.1035264015197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,16,1,power_law_1.2,0.10451200008392333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,2,1,balanced,0.44843733310699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,2,1,balanced,0.45369601249694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,2,1,power_law_1.01,0.4864192008972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,2,1,power_law_1.01,0.4987840175628662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,2,1,power_law_1.2,0.48088321685791013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,2,1,power_law_1.2,0.49259519577026367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,32,1,balanced,0.08892800410588582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,32,1,balanced,0.08936533331871033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,32,1,power_law_1.01,0.08883200287818908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,32,1,power_law_1.01,0.0890175998210907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,32,1,power_law_1.2,0.08776959776878357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,32,1,power_law_1.2,0.0881600022315979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,4,1,balanced,0.25336533784866333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,4,1,balanced,0.2568853298823039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,4,1,power_law_1.01,0.25511679649353025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,4,1,power_law_1.01,0.2553663969039917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,4,1,power_law_1.2,0.2588288068771362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,4,1,power_law_1.2,0.25899519920349123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,8,1,balanced,0.15557333827018738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,8,1,balanced,0.15572800238927206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,8,1,power_law_1.01,0.15253759622573854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,8,1,power_law_1.01,0.1539903998374939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,8,1,power_law_1.2,0.1532415986061096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,16384,2,8,8,1,power_law_1.2,0.15372159481048583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,1,balanced,1.8931253751118977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,1,balanced,2.0437280337015786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,1,power_law_1.01,1.7756671905517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,1,power_law_1.01,1.7893184661865233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,1,power_law_1.2,1.841107177734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,1,power_law_1.2,1.8474687576293944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,128,balanced,0.23253333568572998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,128,balanced,0.23428267240524292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,128,power_law_1.01,0.23471360206604003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,128,power_law_1.01,0.23786239624023436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,128,power_law_1.2,0.23768320083618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,128,power_law_1.2,0.2396672010421753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,16,balanced,0.33477866649627686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,16,balanced,0.3354453245798747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,16,power_law_1.01,0.32854399681091306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,16,power_law_1.01,0.33022079467773435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,16,power_law_1.2,0.3448064088821411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,16,power_law_1.2,0.3466559886932373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,2,balanced,1.0784906546274822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,2,balanced,1.0811093648274739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,2,power_law_1.01,1.0084992408752442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,2,power_law_1.01,1.0308735847473145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,2,power_law_1.2,1.0556415557861327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,2,power_law_1.2,1.0840576171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,256,balanced,0.22588266928990683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,256,balanced,0.22612800200780234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,256,power_law_1.01,0.2278143882751465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,256,power_law_1.01,0.22931199073791503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,256,power_law_1.2,0.2299583911895752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,256,power_law_1.2,0.23192319869995118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,32,balanced,0.2811093330383301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,32,balanced,0.2826346755027771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,32,power_law_1.01,0.28324480056762696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,32,power_law_1.01,0.28389759063720704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,32,power_law_1.2,0.28917760848999025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,32,power_law_1.2,0.29111039638519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,4,balanced,0.6605439980824789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,4,balanced,0.6614506642023722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,4,power_law_1.01,0.6296000003814697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,4,power_law_1.01,0.6311999797821045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,4,power_law_1.2,0.6517695903778076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,4,power_law_1.2,0.6593408107757568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,64,balanced,0.24734399716059366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,64,balanced,0.24819733699162802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,64,power_law_1.01,0.24939520359039308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,64,power_law_1.01,0.25045759677886964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,64,power_law_1.2,0.2548095941543579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,64,power_law_1.2,0.25535359382629397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,8,balanced,0.44438934326171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,8,balanced,0.44576001167297363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,8,power_law_1.01,0.42592639923095704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,8,power_law_1.01,0.4356736183166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,8,power_law_1.2,0.44915199279785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,1,8,power_law_1.2,0.44958720207214353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,16,1,balanced,0.3509440024693807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,16,1,balanced,0.35257601737976074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,16,1,power_law_1.01,0.338809609413147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,16,1,power_law_1.01,0.33968000411987304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,16,1,power_law_1.2,0.35226240158081057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,16,1,power_law_1.2,0.35228800773620605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,2,1,balanced,1.0547359784444172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,2,1,balanced,1.0567999680836995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,2,1,power_law_1.01,0.9880064010620118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,2,1,power_law_1.01,0.99551362991333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,2,1,power_law_1.2,1.023475170135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,2,1,power_law_1.2,1.026591968536377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,32,1,balanced,0.3107626636823018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,32,1,balanced,0.3119093378384908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,32,1,power_law_1.01,0.30259840488433837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,32,1,power_law_1.01,0.30714240074157717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,32,1,power_law_1.2,0.309881591796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,32,1,power_law_1.2,0.31293439865112305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,4,1,balanced,0.641759991645813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,4,1,balanced,0.6418933471043905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,4,1,power_law_1.01,0.6129920005798339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,4,1,power_law_1.01,0.6131072044372559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,4,1,power_law_1.2,0.6330175876617432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,4,1,power_law_1.2,0.643225622177124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,8,1,balanced,0.45459731419881183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,8,1,balanced,0.4546346664428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,8,1,power_law_1.01,0.4357503890991211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,8,1,power_law_1.01,0.4398848056793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,8,1,power_law_1.2,0.4516608238220215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2048,8,256,8,1,power_law_1.2,0.45314559936523435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,1,balanced,1.5518399874369304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,1,balanced,1.564890702565511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,1,power_law_1.01,1.5182527542114257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,1,power_law_1.01,1.548198413848877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,1,power_law_1.2,1.5903871536254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,1,power_law_1.2,1.6012351989746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,16,balanced,0.28628265857696533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,16,balanced,0.2864533265431722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,16,power_law_1.01,0.29490559101104735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,16,power_law_1.01,0.3009471893310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,16,power_law_1.2,0.31249279975891114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,16,power_law_1.2,0.3126015901565552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,2,balanced,0.8659733136494955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,2,balanced,0.8673120339711508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,2,power_law_1.01,0.8568256378173829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,2,power_law_1.01,0.8883647918701172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,2,power_law_1.2,0.9047743797302246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,2,power_law_1.2,0.9092672348022461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,32,balanced,0.24010133743286133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,32,balanced,0.24014933904012045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,32,power_law_1.01,0.2545344114303589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,32,power_law_1.01,0.2567231893539429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,32,power_law_1.2,0.2575808048248291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,32,power_law_1.2,0.26257920265197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,4,balanced,0.5366559823354086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,4,balanced,0.5381919940312704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,4,power_law_1.01,0.5540671825408936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,4,power_law_1.01,0.5545919895172119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,4,power_law_1.2,0.5702784061431885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,4,power_law_1.2,0.575110387802124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,8,balanced,0.3721333344777425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,8,balanced,0.37360533078511554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,8,power_law_1.01,0.3855168104171753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,8,power_law_1.01,0.386028790473938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,8,power_law_1.2,0.39127678871154786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,1,8,power_law_1.2,0.3965440034866333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,16,1,balanced,0.28895999987920123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,16,1,balanced,0.2895093361536662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,16,1,power_law_1.01,0.295795202255249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,16,1,power_law_1.01,0.29663360118865967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,16,1,power_law_1.2,0.300166392326355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,16,1,power_law_1.2,0.3007551908493042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,2,1,balanced,0.8358720143636068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,2,1,balanced,0.8369173208872477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,2,1,power_law_1.01,0.8579008102416992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,2,1,power_law_1.01,0.8603263854980469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,2,1,power_law_1.2,0.8768256187438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,2,1,power_law_1.2,0.884671974182129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,32,1,balanced,0.2626346747080485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,32,1,balanced,0.26342932383219403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,32,1,power_law_1.01,0.27149438858032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,32,1,power_law_1.01,0.2724287986755371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,32,1,power_law_1.2,0.27457280158996583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,32,1,power_law_1.2,0.2761087894439697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,4,1,balanced,0.5148106813430786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,4,1,balanced,0.5151946544647217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,4,1,power_law_1.01,0.5162879943847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,4,1,power_law_1.01,0.5220287799835205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,4,1,power_law_1.2,0.5466368198394775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,4,1,power_law_1.2,0.5474239826202393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,8,1,balanced,0.3500639994939168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,8,1,balanced,0.3503520091374715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,8,1,power_law_1.01,0.3572351932525635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,8,1,power_law_1.01,0.3574975967407227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,8,1,power_law_1.2,0.3740799903869629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,6144,2560,8,160,8,1,power_law_1.2,0.37651839256286623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,1,balanced,2.1913599967956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,1,balanced,2.2004853884379068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,1,power_law_1.01,2.0346048355102537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,1,power_law_1.01,2.142969512939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,1,power_law_1.2,2.141299247741699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,1,power_law_1.2,2.195705604553223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,128,balanced,0.25692800680796307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,128,balanced,0.2574080030123393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,128,power_law_1.01,0.25842559337615967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,128,power_law_1.01,0.26138880252838137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,128,power_law_1.2,0.26257920265197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,128,power_law_1.2,0.2631040096282959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,16,balanced,0.3752319812774658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,16,balanced,0.37668800354003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,16,power_law_1.01,0.37170560359954835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,16,power_law_1.01,0.37457919120788574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,16,power_law_1.2,0.3787904024124146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,16,power_law_1.2,0.38172800540924073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,2,balanced,1.237925370534261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,2,balanced,1.2391200065612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,2,power_law_1.01,1.171168041229248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,2,power_law_1.01,1.1835136413574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,2,power_law_1.2,1.2108799934387207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,2,power_law_1.2,1.2160191535949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,256,balanced,0.25065066417058307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,256,balanced,0.25227733453114826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,256,power_law_1.01,0.2527872085571289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,256,power_law_1.01,0.2536448001861572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,256,power_law_1.2,0.25357439517974856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,256,power_law_1.2,0.2568192005157471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,32,balanced,0.30966933568318683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,32,balanced,0.3103626569112142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,32,power_law_1.01,0.30716800689697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,32,power_law_1.01,0.31076478958129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,32,power_law_1.2,0.31877760887145995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,32,power_law_1.2,0.3219327926635742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,4,balanced,0.7509760061899821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,4,balanced,0.7514879703521729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,4,power_law_1.01,0.7134592056274414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,4,power_law_1.01,0.7204351902008057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,4,power_law_1.2,0.7407807826995849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,4,power_law_1.2,0.7495488166809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,64,balanced,0.27115732431411743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,64,balanced,0.27296533187230426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,64,power_law_1.01,0.2739903926849365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,64,power_law_1.01,0.27686400413513185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,64,power_law_1.2,0.27703680992126467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,64,power_law_1.2,0.28176639080047605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,8,balanced,0.5018506844838461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,8,balanced,0.5021546681722006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,8,power_law_1.01,0.4916287899017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,8,power_law_1.01,0.49713921546936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,8,power_law_1.2,0.4971007823944092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,1,8,power_law_1.2,0.5071040153503418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,16,1,balanced,0.4017599821090698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,16,1,balanced,0.40270400047302246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,16,1,power_law_1.01,0.3916800022125244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,16,1,power_law_1.01,0.3952960014343262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,16,1,power_law_1.2,0.40430078506469724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,16,1,power_law_1.2,0.4046783924102783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,2,1,balanced,1.2248053550720215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,2,1,balanced,1.2356106440226238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,2,1,power_law_1.01,1.1263872146606446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,2,1,power_law_1.01,1.1425151824951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,2,1,power_law_1.2,1.1895744323730468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,2,1,power_law_1.2,1.1964287757873535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,32,1,balanced,0.3550293445587158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,32,1,balanced,0.3570559819539388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,32,1,power_law_1.01,0.34180479049682616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,32,1,power_law_1.01,0.34403200149536134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,32,1,power_law_1.2,0.3557760000228882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,32,1,power_law_1.2,0.35681920051574706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,4,1,balanced,0.7381866772969564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,4,1,balanced,0.7396000226338705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,4,1,power_law_1.01,0.7052544116973877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,4,1,power_law_1.01,0.7109824180603027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,4,1,power_law_1.2,0.7289535999298096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,4,1,power_law_1.2,0.731167984008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,8,1,balanced,0.5221226612726847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,8,1,balanced,0.5240373214085897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,8,1,power_law_1.01,0.5024384021759033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,8,1,power_law_1.01,0.5046080112457275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,8,1,power_law_1.2,0.5181248188018799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,256,8,1,power_law_1.2,0.5193215847015381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,1,balanced,3.522101402282715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,1,balanced,3.5303786595662436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,1,power_law_1.01,2.853683280944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,1,power_law_1.01,2.8620159149169924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,1,power_law_1.2,2.8537151336669924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,1,power_law_1.2,2.967923164367676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,128,balanced,0.3218453327814738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,128,balanced,0.32210665941238403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,128,power_law_1.01,0.31877119541168214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,128,power_law_1.01,0.31905279159545896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,128,power_law_1.2,0.3229439973831177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,128,power_law_1.2,0.3239295959472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,16,balanced,0.49295465151468915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,16,balanced,0.4939359823862712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,16,power_law_1.01,0.479750394821167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,16,power_law_1.01,0.48233599662780763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,16,power_law_1.2,0.4753471851348877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,16,power_law_1.2,0.47739520072937014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,2,balanced,1.7814559936523438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,2,balanced,1.8079573313395183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,2,power_law_1.01,1.571993637084961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,2,power_law_1.01,1.59039363861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,2,power_law_1.2,1.5798463821411133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,2,power_law_1.2,1.6476608276367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,32,balanced,0.40033066272735596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,32,balanced,0.4013813336690267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,32,power_law_1.01,0.390828800201416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,32,power_law_1.01,0.396396803855896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,32,power_law_1.2,0.3946880102157593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,32,power_law_1.2,0.3987776041030884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,4,balanced,1.0491360028584797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,4,balanced,1.0508000055948894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,4,power_law_1.01,0.9472448348999023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,4,power_law_1.01,0.9602304458618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,4,power_law_1.2,0.9599040031433106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,4,power_law_1.2,0.9605440139770508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,64,balanced,0.3486186663309733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,64,balanced,0.34994133313496906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,64,power_law_1.01,0.3426815986633301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,64,power_law_1.01,0.3452415943145752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,64,power_law_1.2,0.3492799997329712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,64,power_law_1.2,0.34983038902282715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,8,balanced,0.6845599810282389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,8,balanced,0.6872159639994303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,8,power_law_1.01,0.6326399803161621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,8,power_law_1.01,0.6543680191040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,8,power_law_1.2,0.6550591945648193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,1,8,power_law_1.2,0.6557055950164795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,16,1,balanced,0.5646346807479858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,16,1,balanced,0.565994660059611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,16,1,power_law_1.01,0.522822380065918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,16,1,power_law_1.01,0.524070405960083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,16,1,power_law_1.2,0.5286528110504151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,16,1,power_law_1.2,0.5323584079742432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,2,1,balanced,1.796005407969157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,2,1,balanced,1.8923786481221516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,2,1,power_law_1.01,1.5365119934082032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,2,1,power_law_1.01,1.5575103759765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,2,1,power_law_1.2,1.5628864288330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,2,1,power_law_1.2,1.5638336181640624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,32,1,balanced,0.5081813335418701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,32,1,balanced,0.5092159907023112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,32,1,power_law_1.01,0.46956801414489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,32,1,power_law_1.01,0.4708672046661377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,32,1,power_law_1.2,0.47547521591186526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,32,1,power_law_1.2,0.47820158004760743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,4,1,balanced,1.0705706278483074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,4,1,balanced,1.0712160269419353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,4,1,power_law_1.01,0.9400896072387696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,4,1,power_law_1.01,0.9564607620239258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,4,1,power_law_1.2,0.9636544227600098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,4,1,power_law_1.2,0.9757120132446289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,8,1,balanced,0.7404747009277344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,8,1,balanced,0.7415733337402344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,8,1,power_law_1.01,0.6556032180786133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,8,1,power_law_1.01,0.6566463947296143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,8,1,power_law_1.2,0.666156816482544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,768,7168,2048,8,384,8,1,power_law_1.2,0.6670207977294922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,1,balanced,0.08413333694140117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,1,balanced,0.08458133538564046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,1,power_law_1.01,0.07330560088157653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,1,power_law_1.01,0.0739135980606079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,1,power_law_1.2,0.06498559713363647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,1,power_law_1.2,0.06799359917640686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,128,balanced,0.027589333554108936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,128,balanced,0.027690666417280834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,128,power_law_1.01,0.02720000147819519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,128,power_law_1.01,0.027897599339485168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,128,power_law_1.2,0.027014398574829103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,128,power_law_1.2,0.02739199995994568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,16,balanced,0.029178666571776073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,16,balanced,0.029765332738558452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,16,power_law_1.01,0.02993279993534088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,16,power_law_1.01,0.03089280128479004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,16,power_law_1.2,0.029023998975753786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,16,power_law_1.2,0.030803200602531434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,2,balanced,0.057461331288019814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,2,balanced,0.058090666929880776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,2,power_law_1.01,0.05203840136528015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,2,power_law_1.01,0.05509120225906372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,2,power_law_1.2,0.04842880070209503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,2,power_law_1.2,0.05056639909744263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,32,balanced,0.029274667302767437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,32,balanced,0.02943466603755951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,32,power_law_1.01,0.027532801032066345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,32,power_law_1.01,0.027846398949623107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,32,power_law_1.2,0.02808319926261902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,32,power_law_1.2,0.028115200996398925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,4,balanced,0.03845866769552231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,4,balanced,0.04040000090996424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,4,power_law_1.01,0.04352000057697296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,4,power_law_1.01,0.044972801208496095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,4,power_law_1.2,0.038815999031066896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,4,power_law_1.2,0.03896960020065308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,64,balanced,0.027189334233601887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,64,balanced,0.02740799884001414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,64,power_law_1.01,0.02707839906215668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,64,power_law_1.01,0.027142399549484254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,64,power_law_1.2,0.027430400252342224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,64,power_law_1.2,0.027795198559761047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,8,balanced,0.03324266771475474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,8,balanced,0.03334933271010717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,8,power_law_1.01,0.03591040074825287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,8,power_law_1.01,0.036185601353645326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,8,power_law_1.2,0.03716480135917664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,1,8,power_law_1.2,0.03731839954853058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,2,1,balanced,0.05497066676616669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,2,1,balanced,0.056032001972198486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,2,1,power_law_1.01,0.04824320077896118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,2,1,power_law_1.01,0.04837760031223297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,2,1,power_law_1.2,0.04612480103969574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,2,1,power_law_1.2,0.04665600061416626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,4,1,balanced,0.03975466638803482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,4,1,balanced,0.03982399900754293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,4,1,power_law_1.01,0.03681919872760773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,4,1,power_law_1.01,0.03749119937419891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,4,1,power_law_1.2,0.03568640053272247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2048,768,8,128,4,1,power_law_1.2,0.03640320003032684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,1,balanced,0.1465226709842682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,1,balanced,0.14726932843526205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,1,power_law_1.01,0.12933759689331054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,1,power_law_1.01,0.13192319869995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,1,power_law_1.2,0.12139519453048705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,1,power_law_1.2,0.12492799758911133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,128,balanced,0.03138133386770884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,128,balanced,0.03330666571855545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,128,power_law_1.01,0.030752000212669373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,128,power_law_1.01,0.031590399146080014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,128,power_law_1.2,0.031206399202346802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,128,power_law_1.2,0.03146879971027374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,16,balanced,0.037632000943024956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,16,balanced,0.0377866675456365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,16,power_law_1.01,0.04707840085029602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,16,power_law_1.01,0.050457602739334105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,16,power_law_1.2,0.05095679759979248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,16,power_law_1.2,0.05098239779472351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,2,balanced,0.09891200065612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,2,balanced,0.10161599516868591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,2,power_law_1.01,0.09426559805870056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,2,power_law_1.01,0.1018496036529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,2,power_law_1.2,0.09271039962768554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,2,power_law_1.2,0.09552639722824097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,32,balanced,0.03532266616821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,32,balanced,0.03562133262554804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,32,power_law_1.01,0.03445119857788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,32,power_law_1.01,0.0355648010969162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,32,power_law_1.2,0.035308799147605895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,32,power_law_1.2,0.03570559918880463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,4,balanced,0.06529599924882253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,4,balanced,0.06630399823188782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,4,power_law_1.01,0.07407360076904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,4,power_law_1.01,0.07912960052490234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,4,power_law_1.2,0.06862080097198486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,4,power_law_1.2,0.07191039919853211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,64,balanced,0.033759998778502144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,64,balanced,0.03565866748491923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,64,power_law_1.01,0.032627201080322264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,64,power_law_1.01,0.03365119993686676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,64,power_law_1.2,0.03327359855175018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,64,power_law_1.2,0.033932799100875856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,8,balanced,0.04860266546408335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,8,balanced,0.05055999755859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,8,power_law_1.01,0.059411197900772095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,8,power_law_1.01,0.05988479852676391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,8,power_law_1.2,0.06104959845542908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,1,8,power_law_1.2,0.06878719925880432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,16,1,balanced,0.09092799822489421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,16,1,balanced,0.09175466497739156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,16,1,power_law_1.01,0.08342400193214417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,16,1,power_law_1.01,0.08533120155334473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,16,1,power_law_1.2,0.08171520233154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,16,1,power_law_1.2,0.08204799890518188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,2,1,balanced,0.09717333316802979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,2,1,balanced,0.09735999504725139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,2,1,power_law_1.01,0.08634880185127258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,2,1,power_law_1.01,0.0871999979019165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,2,1,power_law_1.2,0.07776640057563781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,2,1,power_law_1.2,0.08284800052642823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,32,1,balanced,0.0867039958635966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,32,1,balanced,0.0867680013179779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,32,1,power_law_1.01,0.0785152018070221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,32,1,power_law_1.01,0.08121600151062011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,32,1,power_law_1.2,0.07285119891166687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,32,1,power_law_1.2,0.07315840125083924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,4,1,balanced,0.06404266754786174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,4,1,balanced,0.06474666794141133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,4,1,power_law_1.01,0.05607039928436279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,4,1,power_law_1.01,0.056480002403259275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,4,1,power_law_1.2,0.05493119955062866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,4,1,power_law_1.2,0.056959998607635495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,8,1,balanced,0.10913599530855815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,8,1,balanced,0.1093280017375946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,8,1,power_law_1.01,0.10028799772262573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,8,1,power_law_1.01,0.10098559856414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,8,1,power_law_1.2,0.09337599873542786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,2688,1856,6,128,8,1,power_law_1.2,0.09519360065460206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,1,balanced,0.1731040080388387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,1,balanced,0.19273066520690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,1,power_law_1.01,0.16857600212097168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,1,power_law_1.01,0.16998399496078492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,1,power_law_1.2,0.16043519973754883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,1,power_law_1.2,0.16115200519561768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,128,balanced,0.031311998764673867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,128,balanced,0.031514666974544525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,128,power_law_1.01,0.030713599920272828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,128,power_law_1.01,0.030873599648475646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,128,power_law_1.2,0.031020799279212953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,128,power_law_1.2,0.03112959861755371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,16,balanced,0.03583999971548716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,16,balanced,0.0373279998699824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,16,power_law_1.01,0.06711680293083191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,16,power_law_1.01,0.07123839855194092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,16,power_law_1.2,0.06851840019226074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,16,power_law_1.2,0.07196159958839417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,2,balanced,0.11348799864451091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,2,balanced,0.114138662815094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,2,power_law_1.01,0.12254719734191895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,2,power_law_1.01,0.125600004196167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,2,power_law_1.2,0.11274240016937256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,2,power_law_1.2,0.11713279485702514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,256,balanced,0.03159466634194056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,256,balanced,0.03224000086386999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,256,power_law_1.01,0.030380800366401672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,256,power_law_1.01,0.03043839931488037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,256,power_law_1.2,0.03031040132045746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,256,power_law_1.2,0.030803200602531434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,32,balanced,0.031770666440327965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,32,balanced,0.03178666780392329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,32,power_law_1.01,0.051583999395370485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,32,power_law_1.01,0.05211520195007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,32,power_law_1.2,0.050291198492050174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,32,power_law_1.2,0.051097601652145386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,4,balanced,0.07213333249092102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,4,balanced,0.07421333094437917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,4,power_law_1.01,0.10510720014572143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,4,power_law_1.01,0.10737919807434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,4,power_law_1.2,0.09531520009040832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,4,power_law_1.2,0.09919360280036926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,64,balanced,0.031557333966096245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,64,balanced,0.0334346666932106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,64,power_law_1.01,0.03470720052719116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,64,power_law_1.01,0.03526400029659271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,64,power_law_1.2,0.03459199965000152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,64,power_law_1.2,0.03570559918880463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,8,balanced,0.05014933149019877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,8,balanced,0.054085334142049156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,8,power_law_1.01,0.0834879994392395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,8,power_law_1.01,0.09223679900169372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,8,power_law_1.2,0.0865664005279541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,1,8,power_law_1.2,0.09150720238685608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,16,1,balanced,0.03576533248027166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,16,1,balanced,0.03722133239110311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,16,1,power_law_1.01,0.03768959939479828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,16,1,power_law_1.01,0.03808639943599701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,16,1,power_law_1.2,0.03769600093364715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,16,1,power_law_1.2,0.037913599610328676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,2,1,balanced,0.1034986674785614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,2,1,balanced,0.10382933417956035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,2,1,power_law_1.01,0.10032639503479004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,2,1,power_law_1.01,0.11359360218048095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,2,1,power_law_1.2,0.09682559967041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,32,1,balanced,0.031871999303499855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,32,1,balanced,0.03334933271010717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,32,1,power_law_1.01,0.03359360098838806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,32,1,power_law_1.01,0.03441919982433319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,32,1,power_law_1.2,0.03399679958820343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,32,1,power_law_1.2,0.03491199910640717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,4,1,balanced,0.06621333460013072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,4,1,balanced,0.06704533100128174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,4,1,power_law_1.01,0.06462720036506653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,4,1,power_law_1.01,0.06570240259170532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,4,1,power_law_1.2,0.06155520081520081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,4,1,power_law_1.2,0.06198400259017944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,8,1,balanced,0.04726399978001913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,8,1,balanced,0.047983999053637184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,8,1,power_law_1.01,0.04645760059356689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,8,1,power_law_1.01,0.05707520246505737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,8,1,power_law_1.2,0.04556800127029419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,3072,1536,8,256,8,1,power_law_1.2,0.04576640129089356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,1,balanced,0.25682665904362995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,1,balanced,0.2574719985326131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,1,power_law_1.01,0.24364800453186036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,1,power_law_1.01,0.25055360794067383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,1,power_law_1.2,0.24638719558715821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,1,power_law_1.2,0.2535360097885132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,2,balanced,0.17492266496022543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,2,balanced,0.18687466780344644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,2,power_law_1.01,0.15993599891662597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,2,power_law_1.01,0.1601408004760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,2,power_law_1.2,0.15892479419708253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,2,power_law_1.2,0.16687999963760375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,4,balanced,0.11307733257611592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,4,balanced,0.11496000488599141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,4,power_law_1.01,0.10985599756240845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,4,power_law_1.01,0.11207040548324584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,4,power_law_1.2,0.111353600025177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,4,power_law_1.2,0.11545599699020385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,8,balanced,0.08685333530108134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,8,balanced,0.09327999750773112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,8,power_law_1.01,0.08586239814758301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,8,power_law_1.01,0.08602880239486695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,8,power_law_1.2,0.08550400137901307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,1,8,power_law_1.2,0.08603519797325135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,16,1,balanced,0.03549866626660029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,16,1,balanced,0.03770133356253306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,16,1,power_law_1.01,0.036287999153137206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,16,1,power_law_1.01,0.03704319894313812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,16,1,power_law_1.2,0.035743999481201175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,16,1,power_law_1.2,0.03591040074825287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,2,1,balanced,0.1458080013593038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,2,1,balanced,0.15582933028539023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,2,1,power_law_1.01,0.1380735993385315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,2,1,power_law_1.01,0.14011520147323608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,2,1,power_law_1.2,0.13980159759521485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,2,1,power_law_1.2,0.1422976016998291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,32,1,balanced,0.02938666691382726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,32,1,balanced,0.03033600002527237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,32,1,power_law_1.01,0.028672000765800475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,32,1,power_law_1.01,0.029068800806999206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,32,1,power_law_1.2,0.028672000765800475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,32,1,power_law_1.2,0.029049599170684816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,4,1,balanced,0.08478400111198425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,4,1,balanced,0.08630933364232381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,4,1,power_law_1.01,0.08073599934577942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,4,1,power_law_1.01,0.08260480165481568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,4,1,power_law_1.2,0.07949439883232116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,4,1,power_law_1.2,0.08006399869918823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,8,1,balanced,0.05798399945100149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,8,1,balanced,0.05799466868241628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,8,1,power_law_1.01,0.053548800945281985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,8,1,power_law_1.01,0.05431680083274841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,8,1,power_law_1.2,0.052249598503112796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,14336,2,8,8,1,power_law_1.2,0.056505602598190305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,1,balanced,0.2212373415629069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,1,balanced,0.22533865769704184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,1,power_law_1.01,0.17246079444885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,1,power_law_1.01,0.17857279777526855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,1,power_law_1.2,0.16049280166625976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,1,power_law_1.2,0.16750719547271728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,128,balanced,0.03345066557327906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,128,balanced,0.033786666889985405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,128,power_law_1.01,0.03278720080852508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,128,power_law_1.01,0.032793599367141726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,128,power_law_1.2,0.03219200074672699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,128,power_law_1.2,0.032262399792671204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,16,balanced,0.04174399872620901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,16,balanced,0.04358399907747904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,16,power_law_1.01,0.05400320291519165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,16,power_law_1.01,0.05826560258865356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,16,power_law_1.2,0.04860160052776337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,16,power_law_1.2,0.05287039875984192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,2,balanced,0.1363093356291453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,2,balanced,0.13806399703025818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,2,power_law_1.01,0.1253056049346924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,2,power_law_1.01,0.12569600343704224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,2,power_law_1.2,0.1232192039489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,2,power_law_1.2,0.1279360055923462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,32,balanced,0.035386666655540466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,32,balanced,0.0367999995748202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,32,power_law_1.01,0.03842560052871704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,32,power_law_1.01,0.039647999405860904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,32,power_law_1.2,0.03800959885120392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,32,power_law_1.2,0.03945600092411041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,4,balanced,0.08247999846935272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,4,balanced,0.0836906631787618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,4,power_law_1.01,0.08663039803504943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,4,power_law_1.01,0.09464319944381713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,4,power_law_1.2,0.08944000005722046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,4,power_law_1.2,0.09461119771003723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,64,balanced,0.03332799921433131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,64,balanced,0.03357866654793421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,64,power_law_1.01,0.033555200695991515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,64,power_law_1.01,0.03380480110645294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,64,power_law_1.2,0.033139199018478394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,64,power_law_1.2,0.033548799157142636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,8,balanced,0.05965333183606466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,8,balanced,0.06197333335876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,8,power_law_1.01,0.07577599883079529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,8,power_law_1.01,0.07804160118103028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,8,power_law_1.2,0.06922879815101624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,1,8,power_law_1.2,0.07219840288162231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,16,1,balanced,0.047082667549451195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,16,1,balanced,0.04763199885686239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,16,1,power_law_1.01,0.04403199851512909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,16,1,power_law_1.01,0.04425599873065948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,16,1,power_law_1.2,0.04154239892959595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,16,1,power_law_1.2,0.041657599806785586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,2,1,balanced,0.13461866974830627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,2,1,balanced,0.1355413297812144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,2,1,power_law_1.01,0.11345280408859253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,2,1,power_law_1.01,0.11747839450836181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,2,1,power_law_1.2,0.10085120201110839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,2,1,power_law_1.2,0.10771199464797973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,32,1,balanced,0.04161066561937332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,32,1,balanced,0.04288533329963684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,32,1,power_law_1.01,0.03825919926166534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,32,1,power_law_1.01,0.039827200770378116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,32,1,power_law_1.2,0.03678719997406006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,32,1,power_law_1.2,0.03818880021572113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,4,1,balanced,0.08501866459846497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,4,1,balanced,0.0867680013179779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,4,1,power_law_1.01,0.06826879978179931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,4,1,power_law_1.01,0.06908159852027893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,4,1,power_law_1.2,0.06584960222244263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,4,1,power_law_1.2,0.06639360189437866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,8,1,balanced,0.06226666768391927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,8,1,balanced,0.06234133243560791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,8,1,power_law_1.01,0.052876800298690796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,8,1,power_law_1.01,0.05505920052528381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,8,1,power_law_1.2,0.04995200037956238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,1536,8,128,8,1,power_law_1.2,0.05000960230827332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,1,balanced,0.9156800111134847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,1,balanced,0.9190346399943033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,1,power_law_1.01,0.8150015830993652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,1,power_law_1.01,0.8240127563476562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,1,power_law_1.2,0.7289919853210449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,1,power_law_1.2,0.740505599975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,128,balanced,0.055760001142819725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,128,balanced,0.05782400071620941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,128,power_law_1.01,0.05973119735717773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,128,power_law_1.01,0.06048640012741089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,128,power_law_1.2,0.05446400046348572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,128,power_law_1.2,0.05717759728431702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,16,balanced,0.13844266533851624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,16,balanced,0.139984001715978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,16,power_law_1.01,0.20631039142608643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,16,power_law_1.01,0.20804479122161865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,16,power_law_1.2,0.20798718929290771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,16,power_law_1.2,0.20799360275268555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,2,balanced,0.4984853267669678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,2,balanced,0.5007413228352865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,2,power_law_1.01,0.5119040012359619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,2,power_law_1.01,0.5166719913482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,2,power_law_1.2,0.44879999160766604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,2,power_law_1.2,0.4927999973297119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,256,balanced,0.04780266682306925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,256,balanced,0.047925333182017006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,256,power_law_1.01,0.04644480049610138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,256,power_law_1.01,0.04671359956264496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,256,power_law_1.2,0.04576640129089356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,256,power_law_1.2,0.0462336003780365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,32,balanced,0.09775466720263164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,32,balanced,0.0990826686223348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,32,power_law_1.01,0.1351040005683899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,32,power_law_1.01,0.1368384003639221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,32,power_law_1.2,0.1359935998916626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,32,power_law_1.2,0.13637759685516357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,4,balanced,0.28963200251261395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,4,balanced,0.29314132531483966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,4,power_law_1.01,0.3592063903808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,4,power_law_1.01,0.3671679973602295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,4,power_law_1.2,0.3380095958709717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,4,power_law_1.2,0.36718719005584716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,64,balanced,0.07235733171304067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,64,balanced,0.0757013310988744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,64,power_law_1.01,0.0787775993347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,64,power_law_1.01,0.0807807981967926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,64,power_law_1.2,0.07870079874992371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,64,power_law_1.2,0.08081279993057251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,8,balanced,0.18677333990732828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,8,balanced,0.18835733334223428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,8,power_law_1.01,0.27567999362945556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,8,power_law_1.01,0.28716800212860105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,8,power_law_1.2,0.28090240955352785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,1,8,power_law_1.2,0.2818176031112671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,16,1,balanced,0.4896373351414998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,16,1,balanced,0.4896639982859294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,16,1,power_law_1.01,0.4188096046447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,16,1,power_law_1.01,0.4425407886505127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,16,1,power_law_1.2,0.3809216022491455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,16,1,power_law_1.2,0.3934976100921631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,2,1,balanced,0.48084266980489093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,2,1,balanced,0.48188265164693195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,2,1,power_law_1.01,0.42581758499145506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,2,1,power_law_1.01,0.43468799591064455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,2,1,power_law_1.2,0.38988161087036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,2,1,power_law_1.2,0.39687039852142336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,32,1,balanced,0.4092586835225423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,32,1,balanced,0.4097599983215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,32,1,power_law_1.01,0.3582144021987915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,32,1,power_law_1.01,0.363916802406311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,32,1,power_law_1.2,0.3309056043624878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,32,1,power_law_1.2,0.33235199451446534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,4,1,balanced,0.27483733495076496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,4,1,balanced,0.27782400449117023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,4,1,power_law_1.01,0.2505728006362915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,4,1,power_law_1.01,0.25662078857421877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,4,1,power_law_1.2,0.23299839496612548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,4,1,power_law_1.2,0.2338495969772339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,8,1,balanced,0.17074666420618692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,8,1,balanced,0.1869279940923055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,8,1,power_law_1.01,0.15629440546035767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,8,1,power_law_1.01,0.15652480125427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,8,1,power_law_1.2,0.15000959634780883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,4096,2688,22,512,8,1,power_law_1.2,0.1506432056427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,1,balanced,0.43009599049886066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,1,balanced,0.43303465843200684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,1,power_law_1.01,0.38752639293670654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,1,power_law_1.01,0.43006720542907717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,1,power_law_1.2,0.41560959815979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,1,power_law_1.2,0.43130879402160643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,2,balanced,0.24755734205245972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,2,balanced,0.272053341070811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,2,power_law_1.01,0.22622079849243165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,2,power_law_1.01,0.23708798885345458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,2,power_law_1.2,0.23965439796447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,2,power_law_1.2,0.24900479316711427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,4,balanced,0.16697599490483603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,4,balanced,0.17220799128214517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,4,power_law_1.01,0.1536064028739929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,4,power_law_1.01,0.158188796043396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,4,power_law_1.2,0.15712000131607057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,4,power_law_1.2,0.15754879713058473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,8,balanced,0.11153599619865417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,8,balanced,0.11405866344769795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,8,power_law_1.01,0.11130880117416382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,8,power_law_1.01,0.11276160478591919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,8,power_law_1.2,0.11117440462112427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,1,8,power_law_1.2,0.11146880388259887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,16,1,balanced,0.05806933343410492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,16,1,balanced,0.06014933188756307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,16,1,power_law_1.01,0.05263360142707825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,16,1,power_law_1.01,0.05287039875984192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,16,1,power_law_1.2,0.052275198698043826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,16,1,power_law_1.2,0.05253120064735413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,2,1,balanced,0.22921599944432577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,2,1,balanced,0.24085867404937744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,2,1,power_law_1.01,0.20686719417572022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,2,1,power_law_1.01,0.22203519344329833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,2,1,power_law_1.2,0.22244479656219482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,2,1,power_law_1.2,0.23042559623718262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,32,1,balanced,0.03558400024970373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,32,1,balanced,0.03575466573238373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,32,1,power_law_1.01,0.03528960049152374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,32,1,power_law_1.01,0.036620798707008365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,32,1,power_law_1.2,0.034944000840187076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,32,1,power_law_1.2,0.03877759873867035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,4,1,balanced,0.13314132889111838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,4,1,balanced,0.1455946664015452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,4,1,power_law_1.01,0.1277119994163513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,4,1,power_law_1.01,0.13169280290603638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,4,1,power_law_1.2,0.13489919900894165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,4,1,power_law_1.2,0.14086400270462035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,8,1,balanced,0.08577066659927368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,8,1,balanced,0.08699733018875122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,8,1,power_law_1.01,0.07247359752655029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,8,1,power_law_1.01,0.07428479790687562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,8,1,power_law_1.2,0.07338879704475403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,16384,2,8,8,1,power_law_1.2,0.0754047989845276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,1,balanced,0.4112693468729655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,1,balanced,0.42104534308115643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,1,power_law_1.01,0.4094912052154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,1,power_law_1.01,0.4135424137115479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,1,power_law_1.2,0.4005568027496338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,1,power_law_1.2,0.40189437866210936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,128,balanced,0.0377866675456365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,128,balanced,0.03811199963092804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,128,power_law_1.01,0.04415999948978424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,128,power_law_1.01,0.04426240026950836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,128,power_law_1.2,0.04345600008964538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,128,power_law_1.2,0.044352000951766966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,16,balanced,0.06461866696675618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,16,balanced,0.06499200065930684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,16,power_law_1.01,0.13482880592346191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,16,power_law_1.01,0.1375040054321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,16,power_law_1.2,0.13736319541931152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,16,power_law_1.2,0.1378175973892212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,2,balanced,0.2304640014966329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,2,balanced,0.2397759954134623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,2,power_law_1.01,0.2636159896850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,2,power_law_1.01,0.2715264081954956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,2,power_law_1.2,0.2573951959609985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,2,power_law_1.2,0.26869759559631345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,256,balanced,0.03763733307520548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,256,balanced,0.037765334049860634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,256,power_law_1.01,0.036908799409866334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,256,power_law_1.01,0.03744640052318573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,256,power_law_1.2,0.037964800000190736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,256,power_law_1.2,0.03821440041065216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,32,balanced,0.04582933088143667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,32,balanced,0.047237331668535866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,32,power_law_1.01,0.08332800269126892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,32,power_law_1.01,0.08338559865951538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,32,power_law_1.2,0.0818880021572113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,32,power_law_1.2,0.08529919981956482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,4,balanced,0.13922133048375449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,4,balanced,0.14595733086268106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,4,power_law_1.01,0.20727040767669677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,4,power_law_1.01,0.2109312057495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,4,power_law_1.2,0.18961280584335327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,4,power_law_1.2,0.1984768033027649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,64,balanced,0.037717332442601524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,64,balanced,0.03984533250331879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,64,power_law_1.01,0.063673597574234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,64,power_law_1.01,0.0640447974205017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,64,power_law_1.2,0.057631999254226685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,64,power_law_1.2,0.06254079937934875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,8,balanced,0.08640000224113464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,8,balanced,0.08649067083994548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,8,power_law_1.01,0.1666432023048401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,8,power_law_1.01,0.18707200288772582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,8,power_law_1.2,0.17690880298614503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,1,8,power_law_1.2,0.17886719703674317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,16,1,balanced,0.062277331948280334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,16,1,balanced,0.0642080008983612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,16,1,power_law_1.01,0.06176000237464905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,16,1,power_law_1.01,0.061926400661468504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,16,1,power_law_1.2,0.060652798414230345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,16,1,power_law_1.2,0.060678398609161376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,2,1,balanced,0.2212160031000773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,2,1,balanced,0.22292800744374594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,2,1,power_law_1.01,0.22080640792846679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,2,1,power_law_1.01,0.22428159713745116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,2,1,power_law_1.2,0.2061824083328247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,2,1,power_law_1.2,0.20801279544830323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,32,1,balanced,0.051701332132021584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,32,1,balanced,0.05180266499519348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,32,1,power_law_1.01,0.054655998945236206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,32,1,power_law_1.01,0.054713600873947145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,32,1,power_law_1.2,0.0538752019405365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,32,1,power_law_1.2,0.05434240102767944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,4,1,balanced,0.1334933340549469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,4,1,balanced,0.13380799690882364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,4,1,power_law_1.01,0.13046400547027587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,4,1,power_law_1.01,0.1310912013053894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,4,1,power_law_1.2,0.12311040163040161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,4,1,power_law_1.2,0.12412159442901612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,8,1,balanced,0.08269866804281871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,8,1,balanced,0.0832586685816447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,8,1,power_law_1.01,0.08012800216674805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,8,1,power_law_1.01,0.08125439882278443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,8,1,power_law_1.2,0.07774080038070678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2048,8,256,8,1,power_law_1.2,0.07822719812393189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,1,balanced,0.504858652750651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,1,balanced,0.5065866708755493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,1,power_law_1.01,0.42759041786193847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,1,power_law_1.01,0.42858238220214845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,1,power_law_1.2,0.3897536039352417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,1,power_law_1.2,0.3951807975769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,16,balanced,0.06845866640408833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,16,balanced,0.06972800195217133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,16,power_law_1.01,0.10949120521545411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,16,power_law_1.01,0.11745920181274414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,16,power_law_1.2,0.10820480585098266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,16,power_law_1.2,0.111353600025177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,2,balanced,0.2780853311220805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,2,balanced,0.27826666831970215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,2,power_law_1.01,0.273638391494751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,2,power_law_1.01,0.291596794128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,2,power_law_1.2,0.25338881015777587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,2,power_law_1.2,0.2550463914871216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,32,balanced,0.05195199946562449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,32,balanced,0.05203733344872793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,32,power_law_1.01,0.06929280161857605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,32,power_law_1.01,0.07280640006065368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,32,power_law_1.2,0.0698751986026764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,32,power_law_1.2,0.07279999852180481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,4,balanced,0.1704853375752767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,4,balanced,0.1807253360748291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,4,power_law_1.01,0.17900799512863158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,4,power_law_1.01,0.19386240243911743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,4,power_law_1.2,0.16751359701156615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,4,power_law_1.2,0.18543360233306885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,8,balanced,0.10026666522026062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,8,balanced,0.10081600149472554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,8,power_law_1.01,0.1400320053100586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,8,power_law_1.01,0.165011203289032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,8,power_law_1.2,0.1429759979248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,1,8,power_law_1.2,0.16940159797668458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,16,1,balanced,0.07660266757011414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,16,1,balanced,0.07795199751853943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,16,1,power_law_1.01,0.07024639844894409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,16,1,power_law_1.01,0.0705407977104187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,16,1,power_law_1.2,0.06510080099105835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,16,1,power_law_1.2,0.06594560146331788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,2,1,balanced,0.26897066831588745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,2,1,balanced,0.2719786763191223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,2,1,power_law_1.01,0.23351678848266602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,2,1,power_law_1.01,0.23408639430999756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,2,1,power_law_1.2,0.20908160209655763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,2,1,power_law_1.2,0.21286399364471437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,32,1,balanced,0.06234133243560791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,32,1,balanced,0.062368000547091164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,32,1,power_law_1.01,0.05731199979782105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,32,1,power_law_1.01,0.0582144021987915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,32,1,power_law_1.2,0.0538752019405365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,32,1,power_law_1.2,0.05533440113067627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,4,1,balanced,0.16529599825541177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,4,1,balanced,0.1653439998626709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,4,1,power_law_1.01,0.14188799858093262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,4,1,power_law_1.01,0.14705920219421387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,4,1,power_law_1.2,0.1270848035812378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,4,1,power_law_1.2,0.1307263970375061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,8,1,balanced,0.10284266869227092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,8,1,balanced,0.10504000385602315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,8,1,power_law_1.01,0.08967040181159973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,8,1,power_law_1.01,0.09003520011901855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,8,1,power_law_1.2,0.08122239708900451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,6144,2560,8,160,8,1,power_law_1.2,0.08373119831085205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,1,balanced,0.47411731878916424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,1,balanced,0.4747146765391032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,1,power_law_1.01,0.47178239822387696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,1,power_law_1.01,0.4734655857086182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,1,power_law_1.2,0.4632575988769531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,1,power_law_1.2,0.46457600593566895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,128,balanced,0.042597333590189614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,128,balanced,0.04363733530044556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,128,power_law_1.01,0.048588800430297854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,128,power_law_1.01,0.04910080134868622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,128,power_law_1.2,0.04864639937877655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,128,power_law_1.2,0.0497408002614975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,16,balanced,0.06832000116507213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,16,balanced,0.07084799806276958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,16,power_law_1.01,0.14747519493103028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,16,power_law_1.01,0.14963200092315673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,16,power_law_1.2,0.14914560317993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,16,power_law_1.2,0.150764799118042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,2,balanced,0.2641493280728658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,2,balanced,0.26498667399088544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,2,power_law_1.01,0.3117055892944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,2,power_law_1.01,0.3137792110443115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,2,power_law_1.2,0.29098238945007326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,2,power_law_1.2,0.3027071952819824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,256,balanced,0.04265599946180979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,256,balanced,0.04376000165939331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,256,power_law_1.01,0.04088320136070252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,256,power_law_1.01,0.041843199729919435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,256,power_law_1.2,0.04046719968318939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,256,power_law_1.2,0.040870401263237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,32,balanced,0.04974933465321859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,32,balanced,0.055770665407180786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,32,power_law_1.01,0.09207680225372314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,32,power_law_1.01,0.0944320023059845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,32,power_law_1.2,0.0921280026435852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,32,power_law_1.2,0.09258239865303039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,4,balanced,0.15995200475056967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,4,balanced,0.17244799931844076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,4,power_law_1.01,0.24490880966186523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,4,power_law_1.01,0.25194880962371824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,4,power_law_1.2,0.2149951934814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,4,power_law_1.2,0.22722558975219725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,64,balanced,0.041738669077555336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,64,balanced,0.04362666606903076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,64,power_law_1.01,0.06794880032539367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,64,power_law_1.01,0.06835200190544129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,64,power_law_1.2,0.06656640172004699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,64,power_law_1.2,0.06722559928894042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,8,balanced,0.09503466884295146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,8,balanced,0.09900266925493877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,8,power_law_1.01,0.19175039529800414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,8,power_law_1.01,0.20007679462432862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,8,power_law_1.2,0.18315520286560058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,1,8,power_law_1.2,0.19200639724731444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,16,1,balanced,0.06962666908899943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,16,1,balanced,0.07253866891066234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,16,1,power_law_1.01,0.06810879707336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,16,1,power_law_1.01,0.06876800060272217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,16,1,power_law_1.2,0.06725760102272034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,16,1,power_law_1.2,0.06788480281829834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,2,1,balanced,0.25031999746958417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,2,1,balanced,0.2594719926516215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,2,1,power_law_1.01,0.2504832029342651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,2,1,power_law_1.01,0.2519295930862427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,2,1,power_law_1.2,0.23432960510253906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,2,1,power_law_1.2,0.23619840145111085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,32,1,balanced,0.05982933441797892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,32,1,balanced,0.06075733403364817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,32,1,power_law_1.01,0.061504000425338747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,32,1,power_law_1.01,0.061791998147964475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,32,1,power_law_1.2,0.06053119897842407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,32,1,power_law_1.2,0.06077439785003662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,4,1,balanced,0.15099199612935385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,4,1,balanced,0.1518880029519399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,4,1,power_law_1.01,0.1467136025428772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,4,1,power_law_1.01,0.14956159591674806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,4,1,power_law_1.2,0.13826559782028197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,4,1,power_law_1.2,0.14237439632415771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,8,1,balanced,0.09154133001963298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,8,1,balanced,0.09701866904894511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,8,1,power_law_1.01,0.09006720185279846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,8,1,power_law_1.01,0.09043840169906617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,8,1,power_law_1.2,0.08647040128707886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,256,8,1,power_law_1.2,0.08799999952316284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,1,balanced,0.47408533096313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,1,balanced,0.4754720131556193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,1,power_law_1.01,0.47309441566467286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,1,power_law_1.01,0.47405438423156737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,1,power_law_1.2,0.47207040786743165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,1,power_law_1.2,0.473689603805542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,128,balanced,0.04170133173465729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,128,balanced,0.043680002291997276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,128,power_law_1.01,0.06000000238418579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,128,power_law_1.01,0.06059520244598389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,128,power_law_1.2,0.06021760106086731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,128,power_law_1.2,0.06058239936828613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,16,balanced,0.07037333150704701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,16,balanced,0.07054933408896129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,16,power_law_1.01,0.19748480319976808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,16,power_law_1.01,0.2001471996307373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,16,power_law_1.2,0.19319679737091064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,16,power_law_1.2,0.20263679027557374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,2,balanced,0.2608213424682617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,2,balanced,0.26418666044871014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,2,power_law_1.01,0.32924799919128417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,2,power_law_1.01,0.33658881187438966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,2,power_law_1.2,0.3412224054336548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,2,power_law_1.2,0.3428607940673828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,32,balanced,0.04994666576385498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,32,balanced,0.05004799862702688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,32,power_law_1.01,0.13506560325622557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,32,power_law_1.01,0.1360576033592224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,32,power_law_1.2,0.13630080223083496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,32,power_law_1.2,0.1380735993385315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,4,balanced,0.1529759963353475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,4,balanced,0.15311466654141745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,4,power_law_1.01,0.25871360301971436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,4,power_law_1.01,0.26024320125579836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,4,power_law_1.2,0.27397119998931885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,4,power_law_1.2,0.29044480323791505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,64,balanced,0.04372266431649526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,64,balanced,0.04387199878692627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,64,power_law_1.01,0.0794368028640747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,64,power_law_1.01,0.0802623987197876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,64,power_law_1.2,0.07907840013504028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,64,power_law_1.2,0.07985919713973999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,8,balanced,0.0944106678167979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,8,balanced,0.09609599908192952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,8,power_law_1.01,0.21262719631195068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,8,power_law_1.01,0.2140671968460083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,8,power_law_1.2,0.22522881031036376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,1,8,power_law_1.2,0.2253887891769409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,16,1,balanced,0.06966933111349742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,16,1,balanced,0.06996266543865204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,16,1,power_law_1.01,0.06793599724769592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,16,1,power_law_1.01,0.06878719925880432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,16,1,power_law_1.2,0.06865280270576476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,16,1,power_law_1.2,0.06929919719696045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,2,1,balanced,0.25471999247868854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,2,1,balanced,0.2553866704305013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,2,1,power_law_1.01,0.24990079402923585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,2,1,power_law_1.01,0.2524415969848633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,2,1,power_law_1.2,0.2503743886947632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,2,1,power_law_1.2,0.25138559341430666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,32,1,balanced,0.05982933441797892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,32,1,balanced,0.06020799775918325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,32,1,power_law_1.01,0.06094719767570496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,32,1,power_law_1.01,0.061267197132110596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,32,1,power_law_1.2,0.06183040142059326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,32,1,power_law_1.2,0.061926400661468504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,4,1,balanced,0.14670933286348978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,4,1,balanced,0.14801067113876343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,4,1,power_law_1.01,0.14620159864425658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,4,1,power_law_1.01,0.14833279848098754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,4,1,power_law_1.2,0.14706560373306274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,4,1,power_law_1.2,0.14869120121002197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,8,1,balanced,0.09245333075523376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,8,1,balanced,0.0928000013033549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,8,1,power_law_1.01,0.08990079760551453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,8,1,power_law_1.01,0.09057919979095459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,8,1,power_law_1.2,0.09049599766731262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8,7168,2048,8,384,8,1,power_law_1.2,0.09082880020141601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,1,balanced,0.14451733231544495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,1,balanced,0.14541332920392355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,1,power_law_1.01,0.13464319705963135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,1,power_law_1.01,0.13654400110244752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,1,power_law_1.2,0.13787519931793213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,1,power_law_1.2,0.13985919952392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,128,balanced,0.03738666574160258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,128,balanced,0.03754133234421412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,128,power_law_1.01,0.036575999855995175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,128,power_law_1.01,0.037036800384521486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,128,power_law_1.2,0.036364799737930296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,128,power_law_1.2,0.03648639917373657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,16,balanced,0.03982399900754293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,16,balanced,0.04188799858093262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,16,power_law_1.01,0.039878401160240176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,16,power_law_1.01,0.04012799859046936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,16,power_law_1.2,0.03934719860553741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,16,power_law_1.2,0.039699199795722964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,2,balanced,0.09706133604049683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,2,balanced,0.09860799709955852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,2,power_law_1.01,0.09411839842796325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,2,power_law_1.01,0.09534080028533935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,2,power_law_1.2,0.09467520117759705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,2,power_law_1.2,0.09516159892082214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,32,balanced,0.03774933268626531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,32,balanced,0.039274667700131737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,32,power_law_1.01,0.037190398573875426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,32,power_law_1.01,0.037254399061203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,32,power_law_1.2,0.037350401282310486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,32,power_law_1.2,0.037484800815582274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,4,balanced,0.07082666456699371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,4,balanced,0.072202667593956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,4,power_law_1.01,0.066048002243042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,4,power_law_1.01,0.06799359917640686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,4,power_law_1.2,0.06713600158691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,4,power_law_1.2,0.06873599886894226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,64,balanced,0.037690666814645134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,64,balanced,0.037834666669368744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,64,power_law_1.01,0.03685120046138764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,64,power_law_1.01,0.03691520094871521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,64,power_law_1.2,0.03686400055885315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,64,power_law_1.2,0.037011200189590455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,8,balanced,0.04897066454092661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,8,balanced,0.049957334995269775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,8,power_law_1.01,0.04880000054836273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,8,power_law_1.01,0.04921599924564361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,8,power_law_1.2,0.049292799830436704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,1,8,power_law_1.2,0.04973439872264862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,2,1,balanced,0.10085866848627727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,2,1,balanced,0.10160000125567119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,2,1,power_law_1.01,0.09255040287971497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,2,1,power_law_1.01,0.09471359848976135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,2,1,power_law_1.2,0.09404159784317016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,2,1,power_law_1.2,0.09581440091133117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,4,1,balanced,0.07110933462778728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,4,1,balanced,0.07248533268769582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,4,1,power_law_1.01,0.06819199919700622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,4,1,power_law_1.01,0.06842880249023438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,4,1,power_law_1.2,0.06896640062332153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2048,768,8,128,4,1,power_law_1.2,0.06913920044898987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,1,balanced,0.3631253242492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,1,balanced,0.3638240098953247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,1,power_law_1.01,0.3210943937301636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,1,power_law_1.01,0.32274560928344725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,1,power_law_1.2,0.3201792001724243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,1,power_law_1.2,0.32517759799957274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,128,balanced,0.045519997676213585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,128,balanced,0.045925334095954895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,128,power_law_1.01,0.04459519982337952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,128,power_law_1.01,0.04506880044937134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,128,power_law_1.2,0.04455040097236633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,128,power_law_1.2,0.04496639966964722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,16,balanced,0.06685866912206014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,16,balanced,0.06820799907048543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,16,power_law_1.01,0.06603519916534424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,16,power_law_1.01,0.06632320284843445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,16,power_law_1.2,0.06478719711303711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,16,power_law_1.2,0.06578559875488281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,2,balanced,0.21159466107686362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,2,balanced,0.21287467082341513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,2,power_law_1.01,0.1804927945137024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,2,power_law_1.01,0.1814784049987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,2,power_law_1.2,0.18216960430145263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,2,power_law_1.2,0.1904703974723816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,32,balanced,0.054085334142049156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,32,balanced,0.05425066749254862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,32,power_law_1.01,0.05196800231933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,32,power_law_1.01,0.05262079834938049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,32,power_law_1.2,0.05043839812278748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,32,power_law_1.2,0.052748799324035645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,4,balanced,0.13051733374595642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,4,balanced,0.13402133186658224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,4,power_law_1.01,0.12206720113754273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,4,power_law_1.01,0.12246400117874146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,4,power_law_1.2,0.11656960248947143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,4,power_law_1.2,0.12149759531021118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,64,balanced,0.04576000074545542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,64,balanced,0.045909335215886436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,64,power_law_1.01,0.04487679898738861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,64,power_law_1.01,0.04523519873619079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,64,power_law_1.2,0.045132800936698914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,64,power_law_1.2,0.04555520117282867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,8,balanced,0.08895466725031535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,8,balanced,0.09012800455093384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,8,power_law_1.01,0.08646399974822998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,8,power_law_1.01,0.0867904007434845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,8,power_law_1.2,0.08451200127601624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,1,8,power_law_1.2,0.08601599931716919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,16,1,balanced,0.7624639670054117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,16,1,balanced,0.7639946937561035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,16,1,power_law_1.01,0.6721536159515381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,16,1,power_law_1.01,0.6998015880584717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,16,1,power_law_1.2,0.6760767936706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,16,1,power_law_1.2,0.677177619934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,2,1,balanced,0.21228265762329102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,2,1,balanced,0.2135253349939982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,2,1,power_law_1.01,0.1835904002189636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,2,1,power_law_1.01,0.1889855980873108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,2,1,power_law_1.2,0.18719359636306762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,2,1,power_law_1.2,0.19301120042800904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,32,1,balanced,0.7468106746673584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,32,1,balanced,0.7487733364105225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,32,1,power_law_1.01,0.6523327827453613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,32,1,power_law_1.01,0.6680384159088135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,32,1,power_law_1.2,0.6702079772949219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,32,1,power_law_1.2,0.6703231811523438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,4,1,balanced,0.1323093374570211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,4,1,balanced,0.13302399714787802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,4,1,power_law_1.01,0.11836800575256348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,4,1,power_law_1.01,0.12168960571289063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,4,1,power_law_1.2,0.12408319711685181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,8,1,balanced,1.2619946797688801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,8,1,balanced,1.2670400142669678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,8,1,power_law_1.01,1.092512035369873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,8,1,power_law_1.01,1.1194751739501954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,8,1,power_law_1.2,1.120569610595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,2688,1856,6,128,8,1,power_law_1.2,1.1265151977539063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,1,balanced,0.6304159959157308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,1,balanced,0.6364906628926595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,1,power_law_1.01,0.4902207851409912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,1,power_law_1.01,0.509497594833374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,1,power_law_1.2,0.49358081817626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,1,power_law_1.2,0.5024064064025879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,128,balanced,0.045941332976023354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,128,balanced,0.04621333380540212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,128,power_law_1.01,0.04624640047550201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,128,power_law_1.01,0.04625920057296753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,128,power_law_1.2,0.04599039852619171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,128,power_law_1.2,0.04643200039863586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,16,balanced,0.09337600072224934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,16,balanced,0.09360000491142273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,16,power_law_1.01,0.08054400086402894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,16,power_law_1.01,0.0823743999004364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,16,power_law_1.2,0.08297600150108338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,16,power_law_1.2,0.08590720295906067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,2,balanced,0.3454986810684204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,2,balanced,0.34858667850494385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,2,power_law_1.01,0.28589439392089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,2,power_law_1.01,0.2949631929397583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,2,power_law_1.2,0.27194240093231203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,2,power_law_1.2,0.27241599559783936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,256,balanced,0.045663997530937195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,256,balanced,0.046629334489504494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,256,power_law_1.01,0.04538240134716034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,256,power_law_1.01,0.045535999536514285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,256,power_law_1.2,0.04527359902858734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,256,power_law_1.2,0.04540160000324249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,32,balanced,0.06790400048096974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,32,balanced,0.06819200019041698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,32,power_law_1.01,0.0654591977596283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,32,power_law_1.01,0.06638720035552978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,32,power_law_1.2,0.06506239771842956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,32,power_law_1.2,0.06595199704170226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,4,balanced,0.19825599590937296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,4,balanced,0.19948800404866537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,4,power_law_1.01,0.16549760103225708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,4,power_law_1.01,0.16879359483718873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,4,power_law_1.2,0.1656000018119812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,4,power_law_1.2,0.17620480060577393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,64,balanced,0.04898133377234141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,64,balanced,0.04996266464392344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,64,power_law_1.01,0.047539201378822324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,64,power_law_1.01,0.047788798809051514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,64,power_law_1.2,0.04787839949131012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,64,power_law_1.2,0.04833920001983642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,8,balanced,0.12909332911173502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,8,balanced,0.13063466548919678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,8,power_law_1.01,0.116428804397583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,8,power_law_1.01,0.12068480253219604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,8,power_law_1.2,0.10619519948959351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,1,8,power_law_1.2,0.11668479442596436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,16,1,balanced,0.1135093371073405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,16,1,balanced,0.114464004834493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,16,1,power_law_1.01,0.09857280254364013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,16,1,power_law_1.01,0.099891197681427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,16,1,power_law_1.2,0.09339519739151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,16,1,power_law_1.2,0.0949567973613739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,2,1,balanced,0.35075732072194415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,2,1,balanced,0.3522453308105469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,2,1,power_law_1.01,0.2806272029876709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,2,1,power_law_1.01,0.28178560733795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,2,1,power_law_1.2,0.2792383909225464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,2,1,power_law_1.2,0.2813055992126465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,32,1,balanced,0.09513066212336223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,32,1,balanced,0.0963253378868103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,32,1,power_law_1.01,0.0810368001461029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,32,1,power_law_1.01,0.08218880295753479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,32,1,power_law_1.2,0.08170239925384522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,32,1,power_law_1.2,0.08178560137748718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,4,1,balanced,0.21105599403381348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,4,1,balanced,0.21162132422129312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,4,1,power_law_1.01,0.1714560031890869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,4,1,power_law_1.01,0.17499519586563111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,4,1,power_law_1.2,0.167193603515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,4,1,power_law_1.2,0.1677888035774231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,8,1,balanced,0.14937067031860352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,8,1,balanced,0.14966932932535806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,8,1,power_law_1.01,0.12184319496154786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,8,1,power_law_1.01,0.12323199510574341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,8,1,power_law_1.2,0.11953279972076417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,3072,1536,8,256,8,1,power_law_1.2,0.1217919945716858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,1,balanced,0.3020906647046407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,1,balanced,0.30403733253479004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,1,power_law_1.01,0.359500789642334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,1,power_law_1.01,0.36639358997344973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,1,power_law_1.2,0.36868479251861574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,1,power_law_1.2,0.36871039867401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,2,balanced,0.22344533602396646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,2,balanced,0.23804799715677896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,2,power_law_1.01,0.2362816095352173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,2,power_law_1.01,0.24318079948425292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,2,power_law_1.2,0.2409280061721802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,2,power_law_1.2,0.24416000843048097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,4,balanced,0.15945067008336386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,4,balanced,0.16105600198109946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,4,power_law_1.01,0.179750394821167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,4,power_law_1.01,0.1956480026245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,4,power_law_1.2,0.18855040073394774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,4,power_law_1.2,0.19626879692077637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,8,balanced,0.13766400019327799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,8,balanced,0.1399733324845632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,8,power_law_1.01,0.15802240371704102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,8,power_law_1.01,0.16828800439834596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,8,power_law_1.2,0.15889279842376708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,1,8,power_law_1.2,0.16136319637298585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,16,1,balanced,0.05180266499519348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,16,1,balanced,0.05190933247407278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,16,1,power_law_1.01,0.054150402545928955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,16,1,power_law_1.01,0.05674880146980286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,16,1,power_law_1.2,0.05692160129547119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,16,1,power_law_1.2,0.05749120116233826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,2,1,balanced,0.1789919932683309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,2,1,balanced,0.20870399475097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,2,1,power_law_1.01,0.19524480104446412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,2,1,power_law_1.01,0.1966655969619751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,2,1,power_law_1.2,0.19765759706497193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,2,1,power_law_1.2,0.19953919649124147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,32,1,balanced,0.04350399971008301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,32,1,balanced,0.043840001026789345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,32,1,power_law_1.01,0.0438975989818573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,32,1,power_law_1.01,0.04407039880752563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,32,1,power_law_1.2,0.04439040124416351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,32,1,power_law_1.2,0.04447360038757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,4,1,balanced,0.1090773344039917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,4,1,balanced,0.10956266522407532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,4,1,power_law_1.01,0.1177791953086853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,4,1,power_law_1.01,0.12220799922943115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,4,1,power_law_1.2,0.11811200380325318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,4,1,power_law_1.2,0.12492159605026246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,8,1,balanced,0.07449066638946533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,8,1,balanced,0.0755680004755656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,8,1,power_law_1.01,0.0809984028339386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,8,1,power_law_1.01,0.08587520122528076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,8,1,power_law_1.2,0.08142079710960388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,14336,2,8,8,1,power_law_1.2,0.08273280262947083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,1,balanced,0.4431999921798706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,1,balanced,0.44405333201090497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,1,power_law_1.01,0.40174078941345215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,1,power_law_1.01,0.409606409072876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,1,power_law_1.2,0.4090752124786377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,1,power_law_1.2,0.414412784576416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,128,balanced,0.049866666396458946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,128,balanced,0.050016000866889954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,128,power_law_1.01,0.049497601389884946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,128,power_law_1.01,0.049593600630760196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,128,power_law_1.2,0.049491199851036075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,128,power_law_1.2,0.04952960014343262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,16,balanced,0.07858133316040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,16,balanced,0.08011200030644734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,16,power_law_1.01,0.07505919933319091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,16,power_law_1.01,0.07694079875946044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,16,power_law_1.2,0.07619199752807618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,16,power_law_1.2,0.07724159955978394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,2,balanced,0.24460800488789877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,2,balanced,0.24818666776021323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,2,power_law_1.01,0.2352447986602783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,2,power_law_1.01,0.2399679899215698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,2,power_law_1.2,0.2367232084274292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,2,power_law_1.2,0.23685760498046876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,32,balanced,0.0582826683918635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,32,balanced,0.0599839985370636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,32,power_law_1.01,0.057715201377868654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,32,power_law_1.01,0.058336001634597776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,32,power_law_1.2,0.0585536003112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,32,power_law_1.2,0.058976000547409056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,4,balanced,0.15341867009798685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,4,balanced,0.1536853313446045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,4,power_law_1.01,0.1489408016204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,4,power_law_1.01,0.14908159971237184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,4,power_law_1.2,0.14781440496444703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,4,power_law_1.2,0.14828159809112548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,64,balanced,0.05018133421738943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,64,balanced,0.05197333296140035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,64,power_law_1.01,0.05006080269813538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,64,power_law_1.01,0.05025920271873474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,64,power_law_1.2,0.04958080053329468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,64,power_law_1.2,0.04967679977416992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,8,balanced,0.10743467013041179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,8,balanced,0.1076586643854777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,8,power_law_1.01,0.0993664026260376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,8,power_law_1.01,0.1011199951171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,8,power_law_1.2,0.10158720016479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,1,8,power_law_1.2,0.1019327998161316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,16,1,balanced,0.08793600400288899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,16,1,balanced,0.08874666690826416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,16,1,power_law_1.01,0.08387200236320495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,16,1,power_law_1.01,0.08458240032196045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,16,1,power_law_1.2,0.08408960103988647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,16,1,power_law_1.2,0.08420479893684388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,2,1,balanced,0.24905065695444742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,2,1,balanced,0.24940800666809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,2,1,power_law_1.01,0.22969601154327393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,2,1,power_law_1.01,0.23899519443511963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,2,1,power_law_1.2,0.2330944061279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,2,1,power_law_1.2,0.23827838897705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,32,1,balanced,0.07322666545708974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,32,1,balanced,0.07426666716734569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,32,1,power_law_1.01,0.06844800114631652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,32,1,power_law_1.01,0.06962559819221496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,32,1,power_law_1.2,0.06995199918746949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,32,1,power_law_1.2,0.07034239768981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,4,1,balanced,0.1643893321355184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,4,1,balanced,0.16894932587941489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,4,1,power_law_1.01,0.1522112011909485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,4,1,power_law_1.01,0.15266560316085814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,4,1,power_law_1.2,0.15383679866790773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,4,1,power_law_1.2,0.1541375994682312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,8,1,balanced,0.11032000184059143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,8,1,balanced,0.11185600360234578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,8,1,power_law_1.01,0.10569599866867066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,8,1,power_law_1.01,0.10571520328521729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,8,1,power_law_1.2,0.10611200332641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,1536,8,128,8,1,power_law_1.2,0.10677759647369385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,1,balanced,2.769450823465983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,1,balanced,2.7768214543660483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,1,power_law_1.01,2.321664047241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,1,power_law_1.01,2.412518310546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,1,power_law_1.2,2.3567232131958007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,1,power_law_1.2,2.3820928573608398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,128,balanced,0.09904000163078308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,128,balanced,0.09920000036557515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,128,power_law_1.01,0.09326720237731934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,128,power_law_1.01,0.096288001537323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,128,power_law_1.2,0.0964352011680603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,128,power_law_1.2,0.0974399983882904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,16,balanced,0.25140267610549927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,16,balanced,0.252895991007487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,16,power_law_1.01,0.22862720489501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,16,power_law_1.01,0.22973439693450928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,16,power_law_1.2,0.2283776044845581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,16,power_law_1.2,0.2420032024383545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,2,balanced,1.4381972948710124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,2,balanced,1.4492905934651692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,2,power_law_1.01,1.2069439888000488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,2,power_law_1.01,1.2738240242004395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,2,power_law_1.2,1.2240192413330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,2,power_law_1.2,1.22607364654541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,256,balanced,0.08252800007661183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,256,balanced,0.08364267150561015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,256,power_law_1.01,0.0818560004234314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,256,power_law_1.01,0.08200960159301758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,256,power_law_1.2,0.08135679960250855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,256,power_law_1.2,0.08203520178794861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,32,balanced,0.17018133401870728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,32,balanced,0.1710453430811564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,32,power_law_1.01,0.15665279626846312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,32,power_law_1.01,0.1569983959197998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,32,power_law_1.2,0.1551424026489258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,32,power_law_1.2,0.15717120170593263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,4,balanced,0.7568746407826742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,4,balanced,0.7612533569335938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,4,power_law_1.01,0.6593855857849121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,4,power_law_1.01,0.6681280136108398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,4,power_law_1.2,0.6692416191101074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,4,power_law_1.2,0.6840703964233399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,64,balanced,0.11710400382677714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,64,balanced,0.11972799897193909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,64,power_law_1.01,0.11460479497909545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,64,power_law_1.01,0.11498880386352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,64,power_law_1.2,0.11249920129776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,64,power_law_1.2,0.11265280246734619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,8,balanced,0.41942934195200604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,8,balanced,0.4214133421579997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,8,power_law_1.01,0.3832319974899292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,8,power_law_1.01,0.40159358978271487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,8,power_law_1.2,0.3603584051132202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,1,8,power_law_1.2,0.36909439563751223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,16,1,balanced,7.5550187428792315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,16,1,balanced,7.558757146199544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,16,1,power_law_1.01,6.27391357421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,16,1,power_law_1.01,6.362112045288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,16,1,power_law_1.2,6.387641525268554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,16,1,power_law_1.2,6.468473815917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,2,1,balanced,1.4453706741333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,2,1,balanced,1.5318133036295574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,2,1,power_law_1.01,1.2148863792419433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,2,1,power_law_1.01,1.234931182861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,2,1,power_law_1.2,1.2185855865478517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,2,1,power_law_1.2,1.2231807708740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,32,1,balanced,4.515215873718262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,32,1,balanced,4.518746693929036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,32,1,power_law_1.01,3.7789119720458983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,32,1,power_law_1.01,3.848019027709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,32,1,power_law_1.2,3.771321487426758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,32,1,power_law_1.2,3.816409683227539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,4,1,balanced,0.8099359671274821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,4,1,balanced,0.8105279604593912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,4,1,power_law_1.01,0.68023681640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,4,1,power_law_1.01,0.6890751838684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,4,1,power_law_1.2,0.6840191841125488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,4,1,power_law_1.2,0.6840384006500244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,8,1,balanced,0.48212265968322754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,8,1,balanced,0.49537599086761475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,8,1,power_law_1.01,0.4105408191680908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,8,1,power_law_1.01,0.41472640037536623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,8,1,power_law_1.2,0.41125121116638186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,4096,2688,22,512,8,1,power_law_1.2,0.41654400825500487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,1,balanced,0.5153066714604696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,1,balanced,0.5169066588083903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,1,power_law_1.01,0.5717567920684814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,1,power_law_1.01,0.574399995803833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,1,power_law_1.2,0.5779007911682129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,1,power_law_1.2,0.5894464015960693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,2,balanced,0.29363733530044556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,2,balanced,0.30105066299438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,2,power_law_1.01,0.39617919921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,2,power_law_1.01,0.39663360118865965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,2,power_law_1.2,0.3891968011856079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,2,power_law_1.2,0.3985152006149292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,4,balanced,0.20975999037424722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,4,balanced,0.22073066234588623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,4,power_law_1.01,0.2625983953475952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,4,power_law_1.01,0.26293120384216306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,4,power_law_1.2,0.265446400642395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,4,power_law_1.2,0.2876672029495239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,8,balanced,0.176746666431427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,8,balanced,0.18581332763036093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,8,power_law_1.01,0.20625920295715333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,8,power_law_1.01,0.21521279811859131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,8,power_law_1.2,0.1932736039161682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,1,8,power_law_1.2,0.20592000484466552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,16,1,balanced,0.07673066854476929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,16,1,balanced,0.08027199904123943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,16,1,power_law_1.01,0.08170880079269409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,16,1,power_law_1.01,0.08450559973716736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,16,1,power_law_1.2,0.08184319734573364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,16,1,power_law_1.2,0.08199040293693542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,2,1,balanced,0.28244266907374066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,2,1,balanced,0.28355733553568524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,2,1,power_law_1.01,0.286297607421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,2,1,power_law_1.01,0.29859199523925783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,2,1,power_law_1.2,0.3069119930267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,2,1,power_law_1.2,0.3074944019317627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,32,1,balanced,0.057706668972969055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,32,1,balanced,0.05826666454474131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,32,1,power_law_1.01,0.06062080264091492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,32,1,power_law_1.01,0.06299520134925843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,32,1,power_law_1.2,0.05976319909095764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,32,1,power_law_1.2,0.061452800035476686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,4,1,balanced,0.1590079963207245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,4,1,balanced,0.1595253348350525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,4,1,power_law_1.01,0.17121280431747438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,4,1,power_law_1.01,0.1789247989654541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,4,1,power_law_1.2,0.17255040407180786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,4,1,power_law_1.2,0.17863039970397948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,8,1,balanced,0.11077333490053813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,8,1,balanced,0.12494400143623352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,8,1,power_law_1.01,0.11336319446563721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,8,1,power_law_1.01,0.11392639875411988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,8,1,power_law_1.2,0.11450239419937133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,16384,2,8,8,1,power_law_1.2,0.11512320041656494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,1,balanced,1.6375679969787598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,1,balanced,1.6860853830973308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,1,power_law_1.01,1.270464038848877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,1,power_law_1.01,1.284870433807373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,1,power_law_1.2,1.2550080299377442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,1,power_law_1.2,1.2944767951965332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,128,balanced,0.06922666728496552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,128,balanced,0.07250666618347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,128,power_law_1.01,0.06929280161857605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,128,power_law_1.01,0.07100160121917724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,128,power_law_1.2,0.0709119975566864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,128,power_law_1.2,0.07110400199890136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,16,balanced,0.15658666690190634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,16,balanced,0.1585919956366221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,16,power_law_1.01,0.15024640560150146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,16,power_law_1.01,0.15456000566482545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,16,power_law_1.2,0.15041919946670532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,16,power_law_1.2,0.1531008005142212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,2,balanced,0.8548266887664795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,2,balanced,0.8593760331471761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,2,power_law_1.01,0.7120895862579346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,2,power_law_1.01,0.729036808013916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,2,power_law_1.2,0.6704832077026367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,2,power_law_1.2,0.7043392181396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,256,balanced,0.0631466656923294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,256,balanced,0.0631573349237442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,256,power_law_1.01,0.06231039762496948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,256,power_law_1.01,0.0627135992050171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,256,power_law_1.2,0.06233599781990051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,256,power_law_1.2,0.06282879710197449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,32,balanced,0.12154133121172588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,32,balanced,0.12237333257993062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,32,power_law_1.01,0.099481600522995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,32,power_law_1.01,0.10777599811553955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,32,power_law_1.2,0.10694400072097779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,32,power_law_1.2,0.11134719848632812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,4,balanced,0.46355199813842773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,4,balanced,0.46581868330637616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,4,power_law_1.01,0.3896192073822021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,4,power_law_1.01,0.4417280197143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,4,power_law_1.2,0.36669440269470216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,4,power_law_1.2,0.3823999881744385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,64,balanced,0.09187733133633931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,64,balanced,0.09474133451779683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,64,power_law_1.01,0.09177600145339966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,64,power_law_1.01,0.09284480214118958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,64,power_law_1.2,0.08529279828071594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,64,power_law_1.2,0.09073280096054077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,8,balanced,0.26346667607625324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,8,balanced,0.264138658841451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,8,power_law_1.01,0.22509438991546632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,8,power_law_1.01,0.22943999767303466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,8,power_law_1.2,0.23070719242095947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,1,8,power_law_1.2,0.2427135944366455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,16,1,balanced,0.19333332777023315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,16,1,balanced,0.1946986714998881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,16,1,power_law_1.01,0.16151679754257203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,16,1,power_law_1.01,0.1655743956565857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,16,1,power_law_1.2,0.1572864055633545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,16,1,power_law_1.2,0.16053119897842408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,2,1,balanced,0.8563840389251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,2,1,balanced,0.8577919801076254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,2,1,power_law_1.01,0.667142391204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,2,1,power_law_1.01,0.6878719806671143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,2,1,power_law_1.2,0.6597119808197022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,2,1,power_law_1.2,0.6832191944122314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,32,1,balanced,0.1625759998957316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,32,1,balanced,0.16299200057983398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,32,1,power_law_1.01,0.14075520038604736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,32,1,power_law_1.01,0.14134399890899657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,32,1,power_law_1.2,0.1396415948867798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,32,1,power_law_1.2,0.1396607995033264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,4,1,balanced,0.48179733753204346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,4,1,balanced,0.48367468516031903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,4,1,power_law_1.01,0.37493760585784913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,4,1,power_law_1.01,0.3788928031921387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,4,1,power_law_1.2,0.3740992069244385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,4,1,power_law_1.2,0.3767231941223145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,8,1,balanced,0.29316266377766925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,8,1,balanced,0.29474665721257526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,8,1,power_law_1.01,0.25068159103393556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,8,1,power_law_1.01,0.25077760219573975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,8,1,power_law_1.2,0.24865279197692872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2048,8,256,8,1,power_law_1.2,0.2535423994064331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,1,balanced,1.2949706713358562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,1,balanced,1.3329173723856609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,1,power_law_1.01,1.1279744148254394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,1,power_law_1.01,1.131385612487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,1,power_law_1.2,1.1377984046936036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,1,power_law_1.2,1.1481792449951171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,16,balanced,0.1469066639741262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,16,balanced,0.1473973294099172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,16,power_law_1.01,0.13367040157318116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,16,power_law_1.01,0.13693439960479736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,16,power_law_1.2,0.13252480030059816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,16,power_law_1.2,0.13320319652557372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,2,balanced,0.6856373151143392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,2,balanced,0.6881120204925537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,2,power_law_1.01,0.6010623931884765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,2,power_law_1.01,0.616319990158081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,2,power_law_1.2,0.6074816226959229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,2,power_law_1.2,0.6167424201965332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,32,balanced,0.10557867089907329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,32,balanced,0.10668266812960307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,32,power_law_1.01,0.0997439980506897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,32,power_law_1.01,0.10439679622650147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,32,power_law_1.2,0.10035840272903443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,32,power_law_1.2,0.10239360332489014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,4,balanced,0.37162665526072186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,4,balanced,0.37512000401814777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,4,power_law_1.01,0.33665919303894043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,4,power_law_1.01,0.3523519992828369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,4,power_law_1.2,0.3374592065811157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,4,power_law_1.2,0.3395711898803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,8,balanced,0.22046933571497598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,8,balanced,0.23110934098561606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,8,power_law_1.01,0.2133375883102417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,8,power_law_1.01,0.2135296106338501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,8,power_law_1.2,0.21296000480651855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,1,8,power_law_1.2,0.21965439319610597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,16,1,balanced,0.17702933152516684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,16,1,balanced,0.17785600821177164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,16,1,power_law_1.01,0.16702719926834106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,16,1,power_law_1.01,0.16840319633483886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,16,1,power_law_1.2,0.16381440162658692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,16,1,power_law_1.2,0.16686079502105713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,2,1,balanced,0.6731733481089274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,2,1,balanced,0.6796159744262695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,2,1,power_law_1.01,0.5903679847717285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,2,1,power_law_1.01,0.5937407970428467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,2,1,power_law_1.2,0.6001023769378662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,2,1,power_law_1.2,0.6077888011932373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,32,1,balanced,0.14407466848691305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,32,1,balanced,0.145797332127889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,32,1,power_law_1.01,0.12858879566192627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,32,1,power_law_1.01,0.13178880214691163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,32,1,power_law_1.2,0.13345279693603515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,32,1,power_law_1.2,0.134278404712677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,4,1,balanced,0.3745439847310384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,4,1,balanced,0.38060800234476727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,4,1,power_law_1.01,0.3410239934921265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,4,1,power_law_1.01,0.34191360473632815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,4,1,power_law_1.2,0.34108800888061525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,4,1,power_law_1.2,0.344870400428772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,8,1,balanced,0.25498666365941364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,8,1,balanced,0.25650133689244586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,8,1,power_law_1.01,0.22782719135284424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,8,1,power_law_1.01,0.2312256097793579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,8,1,power_law_1.2,0.22707839012145997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,6144,2560,8,160,8,1,power_law_1.2,0.2282111883163452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,1,balanced,1.9054080645243328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,1,balanced,1.9133973121643066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,1,power_law_1.01,1.4889280319213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,1,power_law_1.01,1.4987199783325196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,1,power_law_1.2,1.4843456268310546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,1,power_law_1.2,1.5029760360717774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,128,balanced,0.08433600266774495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,128,balanced,0.0849173367023468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,128,power_law_1.01,0.08320639729499817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,128,power_law_1.01,0.08371840119361877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,128,power_law_1.2,0.08261119723320007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,128,power_law_1.2,0.08450559973716736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,16,balanced,0.17789334058761597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,16,balanced,0.1790293256441752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,16,power_law_1.01,0.1614400029182434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,16,power_law_1.01,0.1728767991065979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,16,power_law_1.2,0.17034879922866822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,16,power_law_1.2,0.1710271954536438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,2,balanced,0.9924213091532389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,2,balanced,0.994208017985026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,2,power_law_1.01,0.8073856353759765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,2,power_law_1.01,0.8210240364074707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,2,power_law_1.2,0.7466815948486328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,2,power_law_1.2,0.8325759887695312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,256,balanced,0.07086400190989177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,256,balanced,0.0724426656961441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,256,power_law_1.01,0.06794880032539367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,256,power_law_1.01,0.06951040029525757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,256,power_law_1.2,0.06895359754562377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,256,power_law_1.2,0.0692736029624939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,32,balanced,0.13329600294431052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,32,balanced,0.13591466347376505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,32,power_law_1.01,0.1152959942817688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,32,power_law_1.01,0.12942080497741698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,32,power_law_1.2,0.11545599699020385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,32,power_law_1.2,0.11805440187454223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,4,balanced,0.5384000142415365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,4,balanced,0.5665866533915201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,4,power_law_1.01,0.4267712116241455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,4,power_law_1.01,0.4484799861907959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,4,power_law_1.2,0.45061120986938474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,4,power_law_1.2,0.47492480278015137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,64,balanced,0.1011306643486023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,64,balanced,0.10117333134015401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,64,power_law_1.01,0.0984063982963562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,64,power_law_1.01,0.09849600195884704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,64,power_law_1.2,0.0921343982219696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,64,power_law_1.2,0.0981760025024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,8,balanced,0.29229867458343506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,8,balanced,0.2939786712328593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,8,power_law_1.01,0.2628607988357544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,8,power_law_1.01,0.2633023977279663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,8,power_law_1.2,0.2648576021194458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,1,8,power_law_1.2,0.2734463930130005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,16,1,balanced,0.22104533513387045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,16,1,balanced,0.22342399756113687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,16,1,power_law_1.01,0.1840831995010376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,16,1,power_law_1.01,0.18432639837265014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,16,1,power_law_1.2,0.18044159412384034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,16,1,power_law_1.2,0.18353279829025268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,2,1,balanced,0.9907360076904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,2,1,balanced,1.0093493461608887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,2,1,power_law_1.01,0.7829184055328369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,2,1,power_law_1.01,0.7936895847320556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,2,1,power_law_1.2,0.7704576015472412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,2,1,power_law_1.2,0.7766592025756835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,32,1,balanced,0.18437333901723227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,32,1,balanced,0.1848479906717936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,32,1,power_law_1.01,0.15760639905929566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,32,1,power_law_1.01,0.15886080265045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,32,1,power_law_1.2,0.15861120223999023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,32,1,power_law_1.2,0.1592576026916504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,4,1,balanced,0.5481439828872681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,4,1,balanced,0.5592106580734253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,4,1,power_law_1.01,0.4365695953369141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,4,1,power_law_1.01,0.4369215965270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,4,1,power_law_1.2,0.43260798454284666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,4,1,power_law_1.2,0.4416895866394043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,8,1,balanced,0.339354674021403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,8,1,balanced,0.34164265791575116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,8,1,power_law_1.01,0.28229761123657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,8,1,power_law_1.01,0.28424959182739257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,8,1,power_law_1.2,0.28694400787353513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,256,8,1,power_law_1.2,0.28917760848999025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,1,balanced,2.9547573725382485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,1,balanced,3.0273332595825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,1,power_law_1.01,1.9602880477905273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,1,power_law_1.01,1.9934783935546876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,1,power_law_1.2,1.9064767837524415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,1,power_law_1.2,1.9153408050537108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,128,balanced,0.09291199843088786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,128,balanced,0.09451733032862346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,128,power_law_1.01,0.09159680008888245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,128,power_law_1.01,0.09292160272598267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,128,power_law_1.2,0.09098880290985108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,128,power_law_1.2,0.09154559969902039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,16,balanced,0.25150400400161743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,16,balanced,0.2600586613019307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,16,power_law_1.01,0.19778560400009154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,16,power_law_1.01,0.2483520030975342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,16,power_law_1.2,0.20028159618377686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,16,power_law_1.2,0.23811841011047363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,2,balanced,1.4522080421447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,2,balanced,1.4847040176391602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,2,power_law_1.01,1.0587072372436523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,2,power_law_1.01,1.0742591857910155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,2,power_law_1.2,1.0339263916015624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,2,power_law_1.2,1.0416768074035645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,32,balanced,0.17123200496037802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,32,balanced,0.17192532618840536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,32,power_law_1.01,0.15036799907684326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,32,power_law_1.01,0.15063040256500243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,32,power_law_1.2,0.14503040313720703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,32,power_law_1.2,0.1476415991783142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,4,balanced,0.7719519933064779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,4,balanced,0.7719946702321371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,4,power_law_1.01,0.5884416103363037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,4,power_law_1.01,0.6291135787963867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,4,power_law_1.2,0.6705664157867431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,4,power_law_1.2,0.699622392654419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,64,balanced,0.11169067025184631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,64,balanced,0.11201066772143047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,64,power_law_1.01,0.10759680271148682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,64,power_law_1.01,0.10958720445632934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,64,power_law_1.2,0.10901119709014892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,64,power_law_1.2,0.10968960523605346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,8,balanced,0.41681599617004395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,8,balanced,0.41816532611846924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,8,power_law_1.01,0.3449215888977051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,8,power_law_1.01,0.41356801986694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,8,power_law_1.2,0.31769599914550783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,1,8,power_law_1.2,0.34565761089324953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,16,1,balanced,0.3221919933954875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,16,1,balanced,0.33104000488917035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,16,1,power_law_1.01,0.2275712013244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,16,1,power_law_1.01,0.23136639595031738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,16,1,power_law_1.2,0.22410879135131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,16,1,power_law_1.2,0.22723839282989503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,2,1,balanced,1.460192044576009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,2,1,balanced,1.4655626614888508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,2,1,power_law_1.01,1.0207488059997558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,2,1,power_law_1.01,1.0319168090820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,2,1,power_law_1.2,0.9796671867370605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,2,1,power_law_1.2,1.0088128089904784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,32,1,balanced,0.25149865945180255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,32,1,balanced,0.2526773413022359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,32,1,power_law_1.01,0.19052159786224365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,32,1,power_law_1.01,0.19404159784317015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,32,1,power_law_1.2,0.18680959939956665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,32,1,power_law_1.2,0.1870911955833435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,4,1,balanced,0.8010613123575846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,4,1,balanced,0.8063626289367676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,4,1,power_law_1.01,0.5589695930480957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,4,1,power_law_1.01,0.573689603805542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,4,1,power_law_1.2,0.5629695892333985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,4,1,power_law_1.2,0.5631936073303223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,8,1,balanced,0.47413865725199383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,8,1,balanced,0.47549867630004883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,8,1,power_law_1.01,0.34647040367126464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,8,1,power_law_1.01,0.3508863925933838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,8,1,power_law_1.2,0.3391871929168701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,80,7168,2048,8,384,8,1,power_law_1.2,0.3410624027252197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,1,balanced,0.7925706704457601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,1,balanced,0.7934666474660238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,1,power_law_1.01,0.8556672096252441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,1,power_law_1.01,0.8594304084777832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,1,power_law_1.2,0.8655743598937988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,1,power_law_1.2,0.8683584213256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,128,balanced,0.4680853287378947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,128,balanced,0.4696693420410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,128,power_law_1.01,0.494547176361084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,128,power_law_1.01,0.4953728199005127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,128,power_law_1.2,0.5095744132995605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,128,power_law_1.2,0.5104703903198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,16,balanced,0.49182931582132977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,16,balanced,0.4928106864293416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,16,power_law_1.01,0.5211840152740479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,16,power_law_1.01,0.5258111953735352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,16,power_law_1.2,0.5322624206542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,16,power_law_1.2,0.5349760055541992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,2,balanced,0.6692960262298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,2,balanced,0.6717813014984131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,2,power_law_1.01,0.7303679943084717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,2,power_law_1.01,0.7403200149536133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,2,power_law_1.2,0.7268864154815674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,2,power_law_1.2,0.7424511909484863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,32,balanced,0.4774239857991536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,32,balanced,0.4785333474477132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,32,power_law_1.01,0.5015488147735596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,32,power_law_1.01,0.5181056022644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,32,power_law_1.2,0.5222591876983642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,32,power_law_1.2,0.5223999977111816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,4,balanced,0.5642346541086832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,4,balanced,0.5722453196843466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,4,power_law_1.01,0.6054912090301514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,4,power_law_1.01,0.6185535907745361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,4,power_law_1.2,0.6047488212585449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,4,power_law_1.2,0.6103040218353272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,64,balanced,0.4716000159581502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,64,balanced,0.4731466770172119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,64,power_law_1.01,0.4935999870300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,64,power_law_1.01,0.49526400566101075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,64,power_law_1.2,0.5139840126037598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,64,power_law_1.2,0.5200831890106201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,8,balanced,0.5134186744689941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,8,balanced,0.5144000053405762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,8,power_law_1.01,0.5536831855773926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,8,power_law_1.01,0.5558591842651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,8,power_law_1.2,0.5634111881256103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,1,8,power_law_1.2,0.584281587600708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,2,1,balanced,0.5681759913762411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,2,1,balanced,0.5681973298390707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,2,1,power_law_1.01,0.6095615863800049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,2,1,power_law_1.01,0.6107264041900635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,2,1,power_law_1.2,0.6131135940551757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,2,1,power_law_1.2,0.6205376148223877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,4,1,balanced,0.4774133364359538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,4,1,balanced,0.4809279839197795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,4,1,power_law_1.01,0.5102272033691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,4,1,power_law_1.01,0.5122176170349121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,4,1,power_law_1.2,0.5133312225341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2048,768,8,128,4,1,power_law_1.2,0.5140543937683105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,1,balanced,1.3561973571777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,1,balanced,1.3849172592163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,1,power_law_1.01,1.5142144203186034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,1,power_law_1.01,1.526848030090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,1,power_law_1.2,1.5531007766723632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,1,power_law_1.2,1.5545856475830078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,128,balanced,0.6014453172683716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,128,balanced,0.6028960148493449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,128,power_law_1.01,0.651801586151123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,128,power_law_1.01,0.6544127941131592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,128,power_law_1.2,0.6905727863311768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,128,power_law_1.2,0.7101759910583496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,16,balanced,0.6502933502197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,16,balanced,0.6536533435185751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,16,power_law_1.01,0.7139391899108887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,16,power_law_1.01,0.7378816127777099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,16,power_law_1.2,0.7249343872070313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,16,power_law_1.2,0.7514495849609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,2,balanced,1.0192906856536865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,2,balanced,1.0213066736857097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,2,power_law_1.01,1.1323391914367675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,2,power_law_1.01,1.1489343643188477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,2,power_law_1.2,1.1646592140197753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,2,power_law_1.2,1.1806271553039551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,32,balanced,0.6232426563898722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,32,balanced,0.6250026623407999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,32,power_law_1.01,0.6773888111114502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,32,power_law_1.01,0.6788352012634278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,32,power_law_1.2,0.7249472141265869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,32,power_law_1.2,0.7551551818847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,4,balanced,0.8179946740468343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,4,balanced,0.8228480021158854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,4,power_law_1.01,0.8793024063110352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,4,power_law_1.01,0.9024959564208984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,4,power_law_1.2,0.9518464088439942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,4,power_law_1.2,0.9535231590270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,64,balanced,0.6092053254445394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,64,balanced,0.6092533270517985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,64,power_law_1.01,0.6554304122924804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,64,power_law_1.01,0.6675072193145752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,64,power_law_1.2,0.7060927867889404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,64,power_law_1.2,0.7092607975006103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,8,balanced,0.7059146563212076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,8,balanced,0.7078133424123129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,8,power_law_1.01,0.7705599784851074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,8,power_law_1.01,0.8191231727600098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,8,power_law_1.2,0.8030207633972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,1,8,power_law_1.2,0.8127231597900391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,16,1,balanced,2.3561760584513345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,16,1,balanced,2.3564160664876304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,16,1,power_law_1.01,2.712428855895996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,16,1,power_law_1.01,2.7236032485961914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,16,1,power_law_1.2,2.745427131652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,16,1,power_law_1.2,2.755449676513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,2,1,balanced,0.8876000245412191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,2,1,balanced,0.8918826580047607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,2,1,power_law_1.01,0.9816896438598632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,2,1,power_law_1.01,0.9820287704467774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,2,1,power_law_1.2,0.9861120223999024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,2,1,power_law_1.2,0.9951168060302734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,32,1,balanced,2.0534720420837402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,32,1,balanced,2.066373348236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,32,1,power_law_1.01,2.430009651184082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,32,1,power_law_1.01,2.4346303939819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,32,1,power_law_1.2,2.4619775772094727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,32,1,power_law_1.2,2.4711551666259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,4,1,balanced,0.6498506863911947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,4,1,balanced,0.6506079832712809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,4,1,power_law_1.01,0.7070784091949462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,4,1,power_law_1.01,0.7097216129302979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,4,1,power_law_1.2,0.7088511943817138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,4,1,power_law_1.2,0.7128704071044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,8,1,balanced,3.0992587407430015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,8,1,balanced,3.103402773539225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,8,1,power_law_1.01,3.5495487213134767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,8,1,power_law_1.01,3.6574462890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,8,1,power_law_1.2,3.6750720977783202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,2688,1856,6,128,8,1,power_law_1.2,3.7355518341064453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,1,balanced,1.7912960052490234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,1,balanced,1.8272587458292644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,1,power_law_1.01,2.033798408508301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,1,power_law_1.01,2.0384511947631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,1,power_law_1.2,2.098963165283203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,1,power_law_1.2,2.124742317199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,128,balanced,0.7134826978047689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,128,balanced,0.7141546408335367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,128,power_law_1.01,0.7539008140563965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,128,power_law_1.01,0.7575424194335938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,128,power_law_1.2,0.7783040046691895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,128,power_law_1.2,0.7939263820648194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,16,balanced,0.7785867055257162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,16,balanced,0.783029317855835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,16,power_law_1.01,0.8412608146667481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,16,power_law_1.01,0.8564288139343261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,16,power_law_1.2,0.8682815551757812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,16,power_law_1.2,0.8977919578552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,2,balanced,1.2830719947814941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,2,balanced,1.2831786473592122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,2,power_law_1.01,1.452012825012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,2,power_law_1.01,1.4630784034729003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,2,power_law_1.2,1.5216640472412108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,2,power_law_1.2,1.550380802154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,256,balanced,0.7096906503041586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,256,balanced,0.7119519710540771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,256,power_law_1.01,0.7368383884429932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,256,power_law_1.01,0.7403456211090088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,256,power_law_1.2,0.7637760162353515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,256,power_law_1.2,0.765337610244751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,32,balanced,0.7427253723144531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,32,balanced,0.7428426742553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,32,power_law_1.01,0.7901567935943603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,32,power_law_1.01,0.8064191818237305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,32,power_law_1.2,0.8171072006225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,32,power_law_1.2,0.8264127731323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,4,balanced,0.9979146321614584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,4,balanced,1.0015947024027507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,4,power_law_1.01,1.1117631912231445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,4,power_law_1.01,1.1143296241760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,4,power_law_1.2,1.1491711616516114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,4,power_law_1.2,1.1723456382751465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,64,balanced,0.7215413252512614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,64,balanced,0.7226719856262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,64,power_law_1.01,0.7664127826690674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,64,power_law_1.01,0.7682559967041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,64,power_law_1.2,0.7931712150573731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,64,power_law_1.2,0.8029055595397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,8,balanced,0.856544017791748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,8,balanced,0.8632746537526449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,8,power_law_1.01,0.9329792022705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,8,power_law_1.01,0.9495743751525879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,8,power_law_1.2,0.9763968467712403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,1,8,power_law_1.2,0.9819007873535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,16,1,balanced,0.5981013377507528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,16,1,balanced,0.5989013512929281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,16,1,power_law_1.01,0.65797119140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,16,1,power_law_1.01,0.660211181640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,16,1,power_law_1.2,0.664031982421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,16,1,power_law_1.2,0.6670464038848877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,2,1,balanced,1.13210129737854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,2,1,balanced,1.132815996805827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,2,1,power_law_1.01,1.2778112411499023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,2,1,power_law_1.01,1.2836544036865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,2,1,power_law_1.2,1.3063167572021483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,2,1,power_law_1.2,1.3171456336975098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,32,1,balanced,0.5618666807810465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,32,1,balanced,0.5621546506881714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,32,1,power_law_1.01,0.618009614944458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,32,1,power_law_1.01,0.6207871913909913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,32,1,power_law_1.2,0.6270143985748291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,32,1,power_law_1.2,0.6270783901214599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,4,1,balanced,0.8071839809417725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,4,1,balanced,0.807429313659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,4,1,power_law_1.01,0.8996288299560546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,4,1,power_law_1.01,0.9007295608520508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,4,1,power_law_1.2,0.9155263900756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,4,1,power_law_1.2,0.9196096420288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,8,1,balanced,0.6754666964213053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,8,1,balanced,0.6757386525472006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,8,1,power_law_1.01,0.7365952014923096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,8,1,power_law_1.01,0.7375679969787597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,8,1,power_law_1.2,0.7531583786010743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,3072,1536,8,256,8,1,power_law_1.2,0.753382396697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,1,balanced,3.761221249898275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,1,balanced,3.77947203318278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,1,power_law_1.01,3.6477119445800783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,1,power_law_1.01,3.7942718505859374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,1,power_law_1.2,3.7223232269287108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,1,power_law_1.2,3.7518848419189452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,2,balanced,2.26366392771403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,2,balanced,2.2978293100992837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,2,power_law_1.01,2.6089599609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,2,power_law_1.01,2.635174369812012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,2,power_law_1.2,2.809574317932129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,2,power_law_1.2,3.057792091369629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,4,balanced,1.6232320467631023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,4,balanced,1.6398132642110188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,4,power_law_1.01,2.2969472885131834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,4,power_law_1.01,2.5390016555786135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,4,power_law_1.2,2.354591941833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,4,power_law_1.2,2.4137535095214844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,8,balanced,1.3185919920603435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,8,balanced,1.3189653555552165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,8,power_law_1.01,2.2333887100219725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,8,power_law_1.01,2.322368049621582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,8,power_law_1.2,2.2946495056152343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,1,8,power_law_1.2,2.31276798248291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,16,1,balanced,0.3920746644337972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,16,1,balanced,0.39324267705281574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,16,1,power_law_1.01,0.3988735914230347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,16,1,power_law_1.01,0.4006336212158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,16,1,power_law_1.2,0.3957184076309204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,16,1,power_law_1.2,0.39803519248962405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,2,1,balanced,1.8095307350158691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,2,1,balanced,1.8959520657857258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,2,1,power_law_1.01,1.8780672073364257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,2,1,power_law_1.01,1.9107519149780274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,2,1,power_law_1.2,1.8654655456542968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,2,1,power_law_1.2,1.8669824600219727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,32,1,balanced,0.30395734310150146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,32,1,balanced,0.3081973393758138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,32,1,power_law_1.01,0.3085439920425415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,32,1,power_law_1.01,0.3105600118637085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,32,1,power_law_1.2,0.3135103940963745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,32,1,power_law_1.2,0.31417601108551024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,4,1,balanced,0.9673973719278971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,4,1,balanced,0.9984959761301676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,4,1,power_law_1.01,0.9969728469848633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,4,1,power_law_1.01,1.0066752433776855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,4,1,power_law_1.2,0.995257568359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,4,1,power_law_1.2,1.0216896057128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,8,1,balanced,0.5784960190455118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,8,1,balanced,0.5851786533991495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,8,1,power_law_1.01,0.5906432151794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,8,1,power_law_1.01,0.5961919784545898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,8,1,power_law_1.2,0.5946944236755372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,14336,2,8,8,1,power_law_1.2,0.6005504131317139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,1,balanced,2.0388639767964682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,1,balanced,2.203802744547526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,1,power_law_1.01,2.1974592208862305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,1,power_law_1.01,2.237715148925781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,1,power_law_1.2,2.2139583587646485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,1,power_law_1.2,2.2148672103881837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,128,balanced,0.7835893630981445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,128,balanced,0.7840747038523356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,128,power_law_1.01,0.8512960433959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,128,power_law_1.01,0.86561279296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,128,power_law_1.2,0.9146176338195801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,128,power_law_1.2,0.9177984237670899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,16,balanced,0.8579786618550619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,16,balanced,0.8607199986775717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,16,power_law_1.01,0.9553919792175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,16,power_law_1.01,0.9743488311767579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,16,power_law_1.2,1.0107199668884277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,16,power_law_1.2,1.0478976249694825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,2,balanced,1.453269322713216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,2,balanced,1.4546666145324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,2,power_law_1.01,1.6136640548706054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,2,power_law_1.01,1.6350208282470704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,2,power_law_1.2,1.6910655975341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,2,power_law_1.2,1.6911808013916017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,32,balanced,0.815994660059611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,32,balanced,0.8201759656270345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,32,power_law_1.01,0.9270784378051757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,32,power_law_1.01,0.9304960250854493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,32,power_law_1.2,0.9595904350280762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,32,power_law_1.2,0.9841535568237305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,4,balanced,1.1217280228932698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,4,balanced,1.1231359640757244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,4,power_law_1.01,1.2569024085998535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,4,power_law_1.01,1.2647551536560058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,4,power_law_1.2,1.2867520332336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,4,power_law_1.2,1.345363235473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,64,balanced,0.7944373289744059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,64,balanced,0.7955359617869059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,64,power_law_1.01,0.8904191970825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,64,power_law_1.01,0.8937855720520019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,64,power_law_1.2,0.9339712142944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,64,power_law_1.2,0.949824047088623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,8,balanced,0.9425386587778727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,8,balanced,0.9470986525217692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,8,power_law_1.01,1.065561580657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,8,power_law_1.01,1.0715392112731934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,8,power_law_1.2,1.1093695640563965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,1,8,power_law_1.2,1.1134528160095214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,16,1,balanced,0.7165119647979736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,16,1,balanced,0.7174133459726969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,16,1,power_law_1.01,0.7634111881256104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,16,1,power_law_1.01,0.7661952018737793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,16,1,power_law_1.2,0.771065616607666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,16,1,power_law_1.2,0.7718912124633789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,2,1,balanced,1.3024213314056396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,2,1,balanced,1.304474671681722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,2,1,power_law_1.01,1.4150400161743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,2,1,power_law_1.01,1.4162240028381348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,2,1,power_law_1.2,1.4319680213928223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,2,1,power_law_1.2,1.4322943687438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,32,1,balanced,0.6729280153910319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,32,1,balanced,0.6735413074493408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,32,1,power_law_1.01,0.7190720081329346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,32,1,power_law_1.01,0.7254144191741944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,32,1,power_law_1.2,0.7291776180267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,32,1,power_law_1.2,0.7293568134307862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,4,1,balanced,0.944048007329305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,4,1,balanced,0.9461386998494467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,4,1,power_law_1.01,1.013798427581787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,4,1,power_law_1.01,1.0162303924560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,4,1,power_law_1.2,1.0199551582336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,4,1,power_law_1.2,1.0217280387878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,8,1,balanced,0.802191972732544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,8,1,balanced,0.802570660909017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,8,1,power_law_1.01,0.8544447898864747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,8,1,power_law_1.01,0.8545791625976562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,8,1,power_law_1.2,0.8543552398681641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,1536,8,128,8,1,power_law_1.2,0.858182430267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,1,balanced,10.377237319946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,1,balanced,10.509605407714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,1,power_law_1.01,11.123725128173827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,1,power_law_1.01,11.44060821533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,1,power_law_1.2,11.39183349609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,1,power_law_1.2,11.486815643310546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,128,balanced,2.8025172551472983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,128,balanced,2.8086986541748047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,128,power_law_1.01,2.93493766784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,128,power_law_1.01,2.9408063888549805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,128,power_law_1.2,2.9932159423828124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,128,power_law_1.2,3.019379234313965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,16,balanced,3.193493207295736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,16,balanced,3.2078186670939126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,16,power_law_1.01,3.4336639404296876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,16,power_law_1.01,3.4424896240234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,16,power_law_1.2,3.555775833129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,16,power_law_1.2,3.666841506958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,2,balanced,6.342101414998372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,2,balanced,6.4224904378255205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,2,power_law_1.01,7.023161315917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,2,power_law_1.01,7.112531280517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,2,power_law_1.2,7.0376129150390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,2,power_law_1.2,7.3655036926269535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,256,balanced,2.7778987884521484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,256,balanced,2.778719902038574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,256,power_law_1.01,2.8748735427856444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,256,power_law_1.01,2.905574417114258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,256,power_law_1.2,2.967846488952637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,256,power_law_1.2,2.97969913482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,32,balanced,2.969162623087565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,32,balanced,2.9847892125447593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,32,power_law_1.01,3.16497917175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,32,power_law_1.01,3.1865407943725588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,32,power_law_1.2,3.2145790100097655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,32,power_law_1.2,3.2620159149169923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,4,balanced,4.472090721130371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,4,balanced,4.48849614461263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,4,power_law_1.01,4.916864013671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,4,power_law_1.01,4.981625747680664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,4,power_law_1.2,5.108575820922852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,4,power_law_1.2,5.165945434570313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,64,balanced,2.8612747192382812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,64,balanced,2.8614025115966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,64,power_law_1.01,3.0267711639404298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,64,power_law_1.01,3.0423168182373046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,64,power_law_1.2,3.1308351516723634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,64,power_law_1.2,3.174425506591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,8,balanced,3.625647862752279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,8,balanced,3.6371466318766275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,8,power_law_1.01,3.9224384307861326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,8,power_law_1.01,3.9403648376464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,8,power_law_1.2,4.195091247558594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,1,8,power_law_1.2,4.229548645019531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,16,1,balanced,16.986581166585285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,16,1,balanced,17.554181416829426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,16,1,power_law_1.01,19.566496276855467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,16,1,power_law_1.01,19.605317687988283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,16,1,power_law_1.2,19.76640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,16,1,power_law_1.2,20.059097290039062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,2,1,balanced,5.708293279012044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,2,1,balanced,5.965189615885417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,2,1,power_law_1.01,6.207007980346679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,2,1,power_law_1.01,6.381875228881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,2,1,power_law_1.2,6.47900161743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,2,1,power_law_1.2,6.554918670654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,32,1,balanced,12.140416463216146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,32,1,balanced,12.300511678059896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,32,1,power_law_1.01,13.5849853515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,32,1,power_law_1.01,13.673741149902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,32,1,power_law_1.2,13.84637451171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,32,1,power_law_1.2,13.87816925048828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,4,1,balanced,3.6883678436279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,4,1,balanced,3.793055852254232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,4,1,power_law_1.01,3.8972606658935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,4,1,power_law_1.01,3.9778369903564452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,4,1,power_law_1.2,3.9654399871826174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,4,1,power_law_1.2,3.9713088989257814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,8,1,balanced,2.6846612294514975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,8,1,balanced,2.692768096923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,8,1,power_law_1.01,2.795667266845703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,8,1,power_law_1.01,2.8197952270507813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,8,1,power_law_1.2,2.8508480072021483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,4096,2688,22,512,8,1,power_law_1.2,2.8631168365478517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,1,balanced,5.871946970621745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,1,balanced,5.98521614074707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,1,power_law_1.01,5.974515151977539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,1,power_law_1.01,6.276089477539062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,1,power_law_1.2,6.100352096557617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,1,power_law_1.2,6.17154541015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,2,balanced,3.4598185221354165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,2,balanced,3.5737759272257485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,2,power_law_1.01,4.0595134735107425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,2,power_law_1.01,4.076057434082031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,2,power_law_1.2,4.262464141845703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,2,power_law_1.2,4.5328319549560545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,4,balanced,2.2134346961975098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,4,balanced,2.2478133837381997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,4,power_law_1.01,3.421708679199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,4,power_law_1.01,3.4475582122802733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,4,power_law_1.2,3.31591682434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,4,power_law_1.2,3.317740631103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,8,balanced,1.6716853777567546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,8,balanced,1.6790134112040203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,8,power_law_1.01,3.135974311828613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,8,power_law_1.01,3.173017692565918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,8,power_law_1.2,3.1775487899780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,1,8,power_law_1.2,3.300096130371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,16,1,balanced,0.5798879861831665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,16,1,balanced,0.5801013310750326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,16,1,power_law_1.01,0.5859648227691651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,16,1,power_law_1.01,0.5941760063171386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,16,1,power_law_1.2,0.5892223834991455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,16,1,power_law_1.2,0.5901504039764405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,2,1,balanced,2.8878345489501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,2,1,balanced,2.947866757710775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,2,1,power_law_1.01,2.970515251159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,2,1,power_law_1.01,2.995801544189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,2,1,power_law_1.2,2.9687551498413085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,2,1,power_law_1.2,2.9860095977783203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,32,1,balanced,0.43490131696065265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,32,1,balanced,0.43743467330932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,32,1,power_law_1.01,0.43822078704833983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,32,1,power_law_1.01,0.44243202209472654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,32,1,power_law_1.2,0.43739519119262693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,32,1,power_law_1.2,0.4387648105621338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,4,1,balanced,1.5211893717447917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,4,1,balanced,1.5724266370137532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,4,1,power_law_1.01,1.5878399848937987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,4,1,power_law_1.01,1.6089855194091798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,4,1,power_law_1.2,1.564192008972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,4,1,power_law_1.2,1.6035711288452148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,8,1,balanced,0.876693328221639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,8,1,balanced,0.8911306858062744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,8,1,power_law_1.01,0.8964159965515137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,8,1,power_law_1.01,0.9121919631958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,8,1,power_law_1.2,0.9078144073486328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,16384,2,8,8,1,power_law_1.2,0.9085568428039551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,1,balanced,4.254629453023274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,1,balanced,4.432767868041992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,1,power_law_1.01,4.801043319702148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,1,power_law_1.01,4.9233345031738285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,1,power_law_1.2,5.0351806640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,1,power_law_1.2,5.053184127807617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,128,balanced,1.1366986433664958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,128,balanced,1.137178659439087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,128,power_law_1.01,1.2149696350097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,128,power_law_1.01,1.2314111709594726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,128,power_law_1.2,1.2844927787780762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,128,power_law_1.2,1.3026623725891113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,16,balanced,1.300485372543335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,16,balanced,1.3042186896006267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,16,power_law_1.01,1.4614144325256349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,16,power_law_1.01,1.4859135627746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,16,power_law_1.2,1.5613887786865235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,16,power_law_1.2,1.568064022064209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,2,balanced,2.633135954538981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,2,balanced,2.689861297607422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,2,power_law_1.01,2.9985408782958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,2,power_law_1.01,3.0673215866088865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,2,power_law_1.2,3.147097587585449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,2,power_law_1.2,3.2047168731689455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,256,balanced,1.123754660288493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,256,balanced,1.1241652965545654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,256,power_law_1.01,1.2010751724243165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,256,power_law_1.01,1.2028736114501952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,256,power_law_1.2,1.294553565979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,256,power_law_1.2,1.2954751968383789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,32,balanced,1.206997315088908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,32,balanced,1.2085333665211995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,32,power_law_1.01,1.3231616020202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,32,power_law_1.01,1.3308799743652344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,32,power_law_1.2,1.4068415641784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,32,power_law_1.2,1.413100814819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,4,balanced,1.8670026461283367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,4,balanced,1.8853492736816406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,4,power_law_1.01,2.1572608947753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,4,power_law_1.01,2.1662912368774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,4,power_law_1.2,2.238502311706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,4,power_law_1.2,2.245471954345703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,64,balanced,1.1581813494364421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,64,balanced,1.1646347045898438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,64,power_law_1.01,1.2801024436950683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,64,power_law_1.01,1.2915648460388183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,64,power_law_1.2,1.3492032051086427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,64,power_law_1.2,1.3765631675720216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,8,balanced,1.4805067380269368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,8,balanced,1.4954880078633626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,8,power_law_1.01,1.6968191146850586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,8,power_law_1.01,1.7339712142944337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,8,power_law_1.2,1.7901952743530274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,1,8,power_law_1.2,1.8457792282104493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,16,1,balanced,1.0595253308614094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,16,1,balanced,1.0620533625284831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,16,1,power_law_1.01,1.1633472442626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,16,1,power_law_1.01,1.1644736289978028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,16,1,power_law_1.2,1.1817791938781739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,16,1,power_law_1.2,1.1855999946594238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,2,1,balanced,2.378218650817871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,2,1,balanced,2.4521652857462564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,2,1,power_law_1.01,2.7267967224121095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,2,1,power_law_1.01,2.727654457092285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,2,1,power_law_1.2,2.776838493347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,2,1,power_law_1.2,2.8083648681640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,32,1,balanced,0.9799466927846273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,32,1,balanced,0.9802026748657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,32,1,power_law_1.01,1.0829440116882325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,32,1,power_law_1.01,1.0874176025390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,32,1,power_law_1.2,1.0937600135803223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,32,1,power_law_1.2,1.0957504272460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,4,1,balanced,1.5774025917053223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,4,1,balanced,1.5833706855773926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,4,1,power_law_1.01,1.8053247451782226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,4,1,power_law_1.01,1.8124223709106446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,4,1,power_law_1.2,1.8291967391967774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,4,1,power_law_1.2,1.8310527801513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,8,1,balanced,1.2251040140787761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,8,1,balanced,1.2305973370869954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,8,1,power_law_1.01,1.3751680374145507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,8,1,power_law_1.01,1.3766207695007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,8,1,power_law_1.2,1.3907391548156738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2048,8,256,8,1,power_law_1.2,1.3938176155090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,1,balanced,5.464698791503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,1,balanced,5.636277516682942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,1,power_law_1.01,5.048153686523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,1,power_law_1.01,5.205491256713867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,1,power_law_1.2,5.16497917175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,1,power_law_1.2,5.170124816894531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,16,balanced,1.4229493141174316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,16,balanced,1.4252853393554688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,16,power_law_1.01,1.6075519561767577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,16,power_law_1.01,1.6900800704956054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,16,power_law_1.2,1.775257682800293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,16,power_law_1.2,1.7876096725463868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,2,balanced,3.232410748799642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,2,balanced,3.2986666361490884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,2,power_law_1.01,3.273964691162109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,2,power_law_1.01,3.4121856689453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,2,power_law_1.2,3.2994686126708985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,2,power_law_1.2,3.480428695678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,32,balanced,1.2988373438517253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,32,balanced,1.299562692642212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,32,power_law_1.01,1.45797119140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,32,power_law_1.01,1.4650239944458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,32,power_law_1.2,1.5899392127990724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,32,power_law_1.2,1.6267391204833985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,4,balanced,2.167781352996826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,4,balanced,2.175509293874105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,4,power_law_1.01,2.2942783355712892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,4,power_law_1.01,2.341702461242676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,4,power_law_1.2,2.4413312911987304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,4,power_law_1.2,2.540140724182129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,8,balanced,1.6697012583414714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,8,balanced,1.6729706128438313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,8,power_law_1.01,1.8158208847045898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,8,power_law_1.01,1.8400384902954101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,8,power_law_1.2,1.914303970336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,1,8,power_law_1.2,2.029567909240723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,16,1,balanced,1.2259360154469807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,16,1,balanced,1.2264373302459717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,16,1,power_law_1.01,1.220364761352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,16,1,power_law_1.01,1.2222911834716796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,16,1,power_law_1.2,1.2247167587280274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,16,1,power_law_1.2,1.2267519950866699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,2,1,balanced,2.955354690551758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,2,1,balanced,2.9918079376220703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,2,1,power_law_1.01,2.8777088165283202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,2,1,power_law_1.01,2.8813247680664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,2,1,power_law_1.2,2.884262466430664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,2,1,power_law_1.2,2.9254528045654298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,32,1,balanced,1.1072479883829753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,32,1,balanced,1.1073546409606934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,32,1,power_law_1.01,1.1023232460021972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,32,1,power_law_1.01,1.1077631950378417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,32,1,power_law_1.2,1.1125760078430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,32,1,power_law_1.2,1.1160832405090333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,4,1,balanced,1.9110080401102703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,4,1,balanced,1.9257653554280598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,4,1,power_law_1.01,1.893177604675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,4,1,power_law_1.01,1.8936128616333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,4,1,power_law_1.2,1.8984960556030273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,4,1,power_law_1.2,1.9018688201904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,8,1,balanced,1.411413351694743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,8,1,balanced,1.4136427243550618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,8,1,power_law_1.01,1.397651195526123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,8,1,power_law_1.01,1.4044480323791504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,8,1,power_law_1.2,1.4110719680786132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,6144,2560,8,160,8,1,power_law_1.2,1.4142399787902833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,1,balanced,4.759605407714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,1,balanced,4.863295873006185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,1,power_law_1.01,5.654694366455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,1,power_law_1.01,5.809734344482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,1,power_law_1.2,5.763455963134765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,1,power_law_1.2,5.886598587036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,128,balanced,1.243066628774007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,128,balanced,1.248581329981486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,128,power_law_1.01,1.3470208168029785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,128,power_law_1.01,1.3666496276855469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,128,power_law_1.2,1.4342335700988769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,128,power_law_1.2,1.4563136100769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,16,balanced,1.4380745887756348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,16,balanced,1.4382133483886719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,16,power_law_1.01,1.6207103729248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,16,power_law_1.01,1.642470359802246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,16,power_law_1.2,1.6879039764404298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,16,power_law_1.2,1.739232063293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,2,balanced,3.0465758641560874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,2,balanced,3.0721705754597983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,2,power_law_1.01,3.4397567749023437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,2,power_law_1.01,3.4579135894775392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,2,power_law_1.2,3.6394878387451173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,2,power_law_1.2,3.680467224121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,256,balanced,1.232917308807373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,256,balanced,1.236202637354533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,256,power_law_1.01,1.320038414001465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,256,power_law_1.01,1.3240192413330079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,256,power_law_1.2,1.4089344024658204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,256,power_law_1.2,1.4493887901306153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,32,balanced,1.3299307028452556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,32,balanced,1.3318666617075603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,32,power_law_1.01,1.4701184272766112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,32,power_law_1.01,1.4713919639587403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,32,power_law_1.2,1.5526720046997071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,32,power_law_1.2,1.5999679565429688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,4,balanced,2.0848800341288247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,4,balanced,2.0856587092081704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,4,power_law_1.01,2.4616512298583983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,4,power_law_1.01,2.4702720642089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,4,power_law_1.2,2.559008026123047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,4,power_law_1.2,2.591628837585449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,64,balanced,1.270410696665446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,64,balanced,1.2760480244954426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,64,power_law_1.01,1.4156031608581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,64,power_law_1.01,1.4683008193969727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,64,power_law_1.2,1.5056192398071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,64,power_law_1.2,1.5223551750183106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,8,balanced,1.660762627919515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,8,balanced,1.6619200706481934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,8,power_law_1.01,1.8944639205932616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,8,power_law_1.01,1.9315839767456056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,8,power_law_1.2,2.0311296463012694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,1,8,power_law_1.2,2.044236755371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,16,1,balanced,1.2093013127644856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,16,1,balanced,1.2108373641967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,16,1,power_law_1.01,1.3314240455627442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,16,1,power_law_1.01,1.3315327644348145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,16,1,power_law_1.2,1.345088005065918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,16,1,power_law_1.2,1.3459712028503419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,2,1,balanced,2.7603041330973306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,2,1,balanced,2.7618080774943032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,2,1,power_law_1.01,3.1089216232299806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,2,1,power_law_1.01,3.1688703536987304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,2,1,power_law_1.2,3.152275276184082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,2,1,power_law_1.2,3.2703041076660155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,32,1,balanced,1.116634686787923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,32,1,balanced,1.1179786523183186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,32,1,power_law_1.01,1.2356287956237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,32,1,power_law_1.01,1.2365632057189941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,32,1,power_law_1.2,1.253587245941162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,32,1,power_law_1.2,1.2572480201721192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,4,1,balanced,1.7979040145874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,4,1,balanced,1.8160053888956706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,4,1,power_law_1.01,2.07260799407959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,4,1,power_law_1.01,2.0768320083618166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,4,1,power_law_1.2,2.1030527114868165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,4,1,power_law_1.2,2.109222412109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,8,1,balanced,1.409765402475993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,8,1,balanced,1.4111413955688477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,8,1,power_law_1.01,1.576352024078369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,8,1,power_law_1.01,1.5791935920715332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,8,1,power_law_1.2,1.5894911766052247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,256,8,1,power_law_1.2,1.5965248107910157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,1,balanced,6.72866694132487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,1,balanced,6.7577864329020185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,1,power_law_1.01,6.458560180664063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,1,power_law_1.01,6.705023956298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,1,power_law_1.2,6.886003112792968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,1,power_law_1.2,6.941484832763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,128,balanced,1.3147679964701335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,128,balanced,1.3158559799194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,128,power_law_1.01,1.389369583129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,128,power_law_1.01,1.4029952049255372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,128,power_law_1.2,1.4575807571411132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,128,power_law_1.2,1.4662976264953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,16,balanced,1.58898131052653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,16,balanced,1.5927467346191406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,16,power_law_1.01,1.712499237060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,16,power_law_1.01,1.7238784790039063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,16,power_law_1.2,1.7532735824584962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,16,power_law_1.2,1.7556224822998048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,2,balanced,3.9085706075032554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,2,balanced,3.936431884765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,2,power_law_1.01,3.990924835205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,2,power_law_1.01,4.023468780517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,2,power_law_1.2,4.010854339599609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,2,power_law_1.2,4.131321716308594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,32,balanced,1.4331626892089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,32,balanced,1.4357919692993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,32,power_law_1.01,1.525164794921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,32,power_law_1.01,1.5313920021057128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,32,power_law_1.2,1.5814080238342285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,32,power_law_1.2,1.6231807708740233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,4,balanced,2.511360009511312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,4,balanced,2.5217599868774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,4,power_law_1.01,2.5982784271240233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,4,power_law_1.01,2.6605951309204103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,4,power_law_1.2,2.7634944915771484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,4,power_law_1.2,2.8038015365600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,64,balanced,1.3549920717875164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,64,balanced,1.3565173149108887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,64,power_law_1.01,1.4484224319458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,64,power_law_1.01,1.4584704399108888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,64,power_law_1.2,1.49934720993042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,64,power_law_1.2,1.516646385192871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,8,balanced,1.9058772722880046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,8,balanced,1.9064000447591145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,8,power_law_1.01,2.040332794189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,8,power_law_1.01,2.046131134033203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,8,power_law_1.2,2.0943359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,1,8,power_law_1.2,2.1759807586669924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,16,1,balanced,1.473866621653239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,16,1,balanced,1.4754773775736492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,16,1,power_law_1.01,1.4593088150024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,16,1,power_law_1.01,1.460908794403076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,16,1,power_law_1.2,1.491654396057129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,16,1,power_law_1.2,1.4918527603149414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,2,1,balanced,3.6709651947021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,2,1,balanced,3.869845390319824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,2,1,power_law_1.01,3.4913089752197264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,2,1,power_law_1.01,3.593868637084961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,2,1,power_law_1.2,3.6669246673583986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,2,1,power_law_1.2,3.7572864532470702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,32,1,balanced,1.3454933166503906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,32,1,balanced,1.3466614087422688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,32,1,power_law_1.01,1.3376959800720214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,32,1,power_law_1.01,1.3377535820007325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,32,1,power_law_1.2,1.358131217956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,32,1,power_law_1.2,1.3608832359313965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,4,1,balanced,2.3110079765319824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,4,1,balanced,2.3245546023050943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,4,1,power_law_1.01,2.2961151123046877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,4,1,power_law_1.01,2.3415679931640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,4,1,power_law_1.2,2.3695167541503905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,4,1,power_law_1.2,2.378335952758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,8,1,balanced,1.7524693806966145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,8,1,balanced,1.7547787030537922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,8,1,power_law_1.01,1.7348608016967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,8,1,power_law_1.01,1.7351999282836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,8,1,power_law_1.2,1.7719039916992188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,8192,7168,2048,8,384,8,1,power_law_1.2,1.7753856658935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,1,balanced,0.14432533582051596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,1,balanced,0.14587733149528503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,1,power_law_1.01,0.13508479595184325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,1,power_law_1.01,0.13709440231323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,1,power_law_1.2,0.14124159812927245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,1,power_law_1.2,0.14165760278701783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,128,balanced,0.037615999579429626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,128,balanced,0.03789333254098892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,128,power_law_1.01,0.03692159950733185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,128,power_law_1.01,0.03713920116424561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,128,power_law_1.2,0.03717760145664215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,128,power_law_1.2,0.03722879886627197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,16,balanced,0.04171733558177948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,16,balanced,0.04177066683769226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,16,power_law_1.01,0.04010879993438721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,16,power_law_1.01,0.04068480134010315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,16,power_law_1.2,0.039705601334571836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,16,power_law_1.2,0.03985919952392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,2,balanced,0.09780266880989075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,2,balanced,0.09874133268992107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,2,power_law_1.01,0.0932096004486084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,2,power_law_1.01,0.0955839991569519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,2,power_law_1.2,0.09507840275764465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,2,power_law_1.2,0.09773439764976502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,32,balanced,0.039706667264302574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,32,balanced,0.039861333866914116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,32,power_law_1.01,0.037222400307655334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,32,power_law_1.01,0.037363201379776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,32,power_law_1.2,0.037574398517608645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,32,power_law_1.2,0.037651199102401736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,4,balanced,0.07233066856861115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,4,balanced,0.07233599821726482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,4,power_law_1.01,0.06580479741096497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,4,power_law_1.01,0.06584960222244263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,4,power_law_1.2,0.06887680292129517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,4,power_law_1.2,0.07000319957733155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,64,balanced,0.03793599953254064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,64,balanced,0.0397173340121905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,64,power_law_1.01,0.03688960075378418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,64,power_law_1.01,0.03738240003585815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,64,power_law_1.2,0.037376001477241516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,64,power_law_1.2,0.03751679956912994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,8,balanced,0.049957334995269775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,8,balanced,0.051669334371884666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,8,power_law_1.01,0.048607999086380006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,8,power_law_1.01,0.0497408002614975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,8,power_law_1.2,0.049446401000022885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,1,8,power_law_1.2,0.0496832013130188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,2,1,balanced,0.09731200337409973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,2,1,balanced,0.1039680043856303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,2,1,power_law_1.01,0.09376639723777772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,2,1,power_law_1.01,0.09471359848976135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,2,1,power_law_1.2,0.09483519792556763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,2,1,power_law_1.2,0.09566079974174499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,4,1,balanced,0.07053333520889282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,4,1,balanced,0.07283733288447063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,4,1,power_law_1.01,0.0688256025314331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,4,1,power_law_1.01,0.0695680022239685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,4,1,power_law_1.2,0.06841599941253662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2048,768,8,128,4,1,power_law_1.2,0.06910719871520996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,1,balanced,0.3637813329696655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,1,balanced,0.3657279809315999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,1,power_law_1.01,0.31746559143066405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,1,power_law_1.01,0.32585599422454836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,1,power_law_1.2,0.3206592082977295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,1,power_law_1.2,0.33098878860473635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,128,balanced,0.04566933214664459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,128,balanced,0.04753600060939789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,128,power_law_1.01,0.044819200038909913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,128,power_law_1.01,0.04538240134716034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,128,power_law_1.2,0.04500479996204376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,128,power_law_1.2,0.04545280039310455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,16,balanced,0.06806933383146922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,16,balanced,0.06843733290831248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,16,power_law_1.01,0.06506879925727845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,16,power_law_1.01,0.06641280055046081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,16,power_law_1.2,0.06625919938087463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,16,power_law_1.2,0.06640639901161194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,2,balanced,0.21344000101089478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,2,balanced,0.21371199687321982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,2,power_law_1.01,0.18839679956436156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,2,power_law_1.01,0.19303679466247559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,2,power_law_1.2,0.18807679414749146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,2,power_law_1.2,0.19610240459442138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,32,balanced,0.05409599840641022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,32,balanced,0.055914665261904396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,32,power_law_1.01,0.051712000370025636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,32,power_law_1.01,0.05378559827804565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,32,power_law_1.2,0.051795202493667605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,32,power_law_1.2,0.0520576000213623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,4,balanced,0.13432000080744425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,4,balanced,0.13562666376431784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,4,power_law_1.01,0.12380160093307495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,4,power_law_1.01,0.12610559463500975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,4,power_law_1.2,0.12367360591888428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,4,power_law_1.2,0.12409600019454955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,64,balanced,0.045824001232783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,64,balanced,0.047237331668535866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,64,power_law_1.01,0.045049598813056944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,64,power_law_1.01,0.04556800127029419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,64,power_law_1.2,0.04591360092163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,64,power_law_1.2,0.045926401019096376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,8,balanced,0.08932266632715861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,8,balanced,0.09058666229248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,8,power_law_1.01,0.08540800213813782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,8,power_law_1.01,0.08703359961509705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,8,power_law_1.2,0.08600959777832032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,1,8,power_law_1.2,0.08696960210800171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,16,1,balanced,0.7628106276194254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,16,1,balanced,0.7640746434529623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,16,1,power_law_1.01,0.6766784191131592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,16,1,power_law_1.01,0.6927807807922364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,16,1,power_law_1.2,0.6882815837860108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,16,1,power_law_1.2,0.6948863983154296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,2,1,balanced,0.2148853341738383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,2,1,balanced,0.21574934323628744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,2,1,power_law_1.01,0.1859071969985962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,2,1,power_law_1.01,0.18814079761505126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,2,1,power_law_1.2,0.1888703942298889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,2,1,power_law_1.2,0.19370880126953124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,32,1,balanced,0.7457173665364584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,32,1,balanced,0.7482293446858724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,32,1,power_law_1.01,0.6722496032714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,32,1,power_law_1.01,0.6872447967529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,32,1,power_law_1.2,0.6902463912963868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,32,1,power_law_1.2,0.6974016189575195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,4,1,balanced,0.13404267032941183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,4,1,balanced,0.13421333829561868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,4,1,power_law_1.01,0.12289919853210449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,4,1,power_law_1.01,0.1236415982246399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,4,1,power_law_1.2,0.12276480197906495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,4,1,power_law_1.2,0.1247871994972229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,8,1,balanced,1.2631306648254395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,8,1,balanced,1.268666664759318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,8,1,power_law_1.01,1.108467197418213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,8,1,power_law_1.01,1.1309120178222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,8,1,power_law_1.2,1.112076759338379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,2688,1856,6,128,8,1,power_law_1.2,1.1219712257385255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,1,balanced,0.6322986682256063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,1,balanced,0.6375626722971598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,1,power_law_1.01,0.5051583766937255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,1,power_law_1.01,0.5159167766571044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,1,power_law_1.2,0.5051072120666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,1,power_law_1.2,0.5071680068969726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,128,balanced,0.047781333327293396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,128,balanced,0.04805333415667216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,128,power_law_1.01,0.04664320051670075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,128,power_law_1.01,0.04687359929084778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,128,power_law_1.2,0.04707199931144714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,128,power_law_1.2,0.047219198942184445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,16,balanced,0.09470400214195251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,16,balanced,0.09482666850090027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,16,power_law_1.01,0.08403840065002441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,16,power_law_1.01,0.09191679954528809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,16,power_law_1.2,0.07807999849319458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,16,power_law_1.2,0.08375679850578308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,2,balanced,0.34681065877278644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,2,balanced,0.3471733331680298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,2,power_law_1.01,0.27705600261688235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,2,power_law_1.01,0.29252479076385496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,2,power_law_1.2,0.27674880027771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,2,power_law_1.2,0.2923264026641846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,256,balanced,0.04756799836953481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,256,balanced,0.047824000318845115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,256,power_law_1.01,0.045721599459648134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,256,power_law_1.01,0.04636160135269165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,256,power_law_1.2,0.04574080109596253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,256,power_law_1.2,0.04599680006504059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,32,balanced,0.06708799799283345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,32,balanced,0.06950399776299794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,32,power_law_1.01,0.064300799369812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,32,power_law_1.01,0.06680960059165955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,32,power_law_1.2,0.06553599834442139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,32,power_law_1.2,0.06563839912414551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,4,balanced,0.1987733244895935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,4,balanced,0.20102399587631226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,4,power_law_1.01,0.1686336040496826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,4,power_law_1.01,0.17696640491485596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,4,power_law_1.2,0.17006720304489137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,4,power_law_1.2,0.17200000286102296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,64,balanced,0.04971200227737427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,64,balanced,0.04987200101216634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,64,power_law_1.01,0.04816640019416809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,64,power_law_1.01,0.04917120039463043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,64,power_law_1.2,0.04813440144062042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,64,power_law_1.2,0.048416000604629514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,8,balanced,0.1297813355922699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,8,balanced,0.12984533111254373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,8,power_law_1.01,0.11553280353546143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,8,power_law_1.01,0.11783679723739623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,8,power_law_1.2,0.11585919857025147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,1,8,power_law_1.2,0.11906559467315674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,16,1,balanced,0.11334932843844096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,16,1,balanced,0.11375466982523601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,16,1,power_law_1.01,0.09777920246124268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,16,1,power_law_1.01,0.10250879526138305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,16,1,power_law_1.2,0.0989247977733612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,16,1,power_law_1.2,0.09958400130271912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,2,1,balanced,0.35045333703358966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,2,1,balanced,0.35170666376749676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,2,1,power_law_1.01,0.28718719482421873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,2,1,power_law_1.01,0.2948863983154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,2,1,power_law_1.2,0.28488318920135497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,2,1,power_law_1.2,0.28586881160736083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,32,1,balanced,0.0950986643632253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,32,1,balanced,0.09630933403968811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,32,1,power_law_1.01,0.08301439881324768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,32,1,power_law_1.01,0.08385279774665833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,32,1,power_law_1.2,0.08220800161361694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,32,1,power_law_1.2,0.08320000171661376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,4,1,balanced,0.21000534296035767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,4,1,balanced,0.2121653358141581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,4,1,power_law_1.01,0.17601920366287233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,4,1,power_law_1.01,0.17722879648208617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,4,1,power_law_1.2,0.17408000230789183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,4,1,power_law_1.2,0.17663359642028809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,8,1,balanced,0.1498240033785502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,8,1,balanced,0.153221329053243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,8,1,power_law_1.01,0.12390400171279907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,8,1,power_law_1.01,0.12647039890289308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,8,1,power_law_1.2,0.12577919960021972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,3072,1536,8,256,8,1,power_law_1.2,0.12978559732437134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,1,balanced,0.3359626531600952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,1,balanced,0.3363200028737386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,1,power_law_1.01,0.3749248027801514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,1,power_law_1.01,0.38588800430297854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,1,power_law_1.2,0.3733247995376587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,1,power_law_1.2,0.38303360939025877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,2,balanced,0.2258453369140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,2,balanced,0.23958933353424072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,2,power_law_1.01,0.2544384002685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,2,power_law_1.01,0.2676095962524414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,2,power_law_1.2,0.2569472074508667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,2,power_law_1.2,0.2604543924331665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,4,balanced,0.1607360045115153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,4,balanced,0.1641759971777598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,4,power_law_1.01,0.19884159564971923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,4,power_law_1.01,0.20424959659576417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,4,power_law_1.2,0.19753600358963014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,4,power_law_1.2,0.1997760057449341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,8,balanced,0.1379039982954661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,8,balanced,0.14135467012723288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,8,power_law_1.01,0.1661247968673706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,8,power_law_1.01,0.17204480171203612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,8,power_law_1.2,0.1660223960876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,1,8,power_law_1.2,0.16824320554733277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,16,1,balanced,0.05392000079154968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,16,1,balanced,0.05434666574001312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,16,1,power_law_1.01,0.062054401636123656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,16,1,power_law_1.01,0.06377599835395813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,16,1,power_law_1.2,0.058956801891326904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,16,1,power_law_1.2,0.06418560147285461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,2,1,balanced,0.19458132982254028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,2,1,balanced,0.2299733360608419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,2,1,power_law_1.01,0.2035520076751709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,2,1,power_law_1.01,0.20728321075439454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,2,1,power_law_1.2,0.2099839925765991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,2,1,power_law_1.2,0.21347200870513916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,32,1,balanced,0.04560533165931702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,32,1,balanced,0.04582933088143667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,32,1,power_law_1.01,0.04431999921798706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,32,1,power_law_1.01,0.044684800505638125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,32,1,power_law_1.2,0.044844800233840944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,32,1,power_law_1.2,0.045023998618125914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,4,1,balanced,0.11485866705576579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,4,1,balanced,0.1165120005607605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,4,1,power_law_1.01,0.1253376007080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,4,1,power_law_1.01,0.12866560220718384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,4,1,power_law_1.2,0.12792320251464845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,4,1,power_law_1.2,0.1283136010169983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,8,1,balanced,0.0800853321949641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,8,1,balanced,0.08015466729799907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,8,1,power_law_1.01,0.08556159734725952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,8,1,power_law_1.01,0.08723199963569642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,8,1,power_law_1.2,0.08654080033302307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,14336,2,8,8,1,power_law_1.2,0.08671360015869141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,1,balanced,0.4442880153656006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,1,balanced,0.4454346497853597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,1,power_law_1.01,0.40622720718383787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,1,power_law_1.01,0.41288318634033205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,1,power_law_1.2,0.4140607833862305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,1,power_law_1.2,0.4273536205291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,128,balanced,0.051269332567850746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,128,balanced,0.05198400219281515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,128,power_law_1.01,0.04997119903564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,128,power_law_1.01,0.05016319751739502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,128,power_law_1.2,0.049747198820114136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,128,power_law_1.2,0.04986880123615265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,16,balanced,0.0807360013326009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,16,balanced,0.08118933439254761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,16,power_law_1.01,0.07731840014457703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,16,power_law_1.01,0.07775359749794006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,16,power_law_1.2,0.07827839851379395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,16,power_law_1.2,0.07913600206375122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,2,balanced,0.2469173272450765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,2,balanced,0.24885867039362589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,2,power_law_1.01,0.23907840251922607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,2,power_law_1.01,0.23922560214996338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,2,power_law_1.2,0.23840639591217042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,2,power_law_1.2,0.24031999111175537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,32,balanced,0.06030400097370148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,32,balanced,0.061306665341059365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,32,power_law_1.01,0.05975679755210876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,32,power_law_1.01,0.06001920104026794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,32,power_law_1.2,0.0611519992351532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,32,power_law_1.2,0.0638592004776001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,4,balanced,0.15517333149909973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,4,balanced,0.15614933768908182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,4,power_law_1.01,0.15112320184707642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,4,power_law_1.01,0.15125759840011596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,4,power_law_1.2,0.1510208010673523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,4,power_law_1.2,0.15103360414505004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,64,balanced,0.05142933130264282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,64,balanced,0.052042668064435325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,64,power_law_1.01,0.05072640180587769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,64,power_law_1.01,0.05080320239067078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,64,power_law_1.2,0.050271999835968015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,64,power_law_1.2,0.05041279792785645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,8,balanced,0.10823999842007954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,8,balanced,0.10946133732795715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,8,power_law_1.01,0.09942399859428405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,8,power_law_1.01,0.10001920461654663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,8,power_law_1.2,0.09920639991760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,1,8,power_law_1.2,0.10405119657516479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,16,1,balanced,0.08826667070388794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,16,1,balanced,0.0899786651134491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,16,1,power_law_1.01,0.08463360071182251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,16,1,power_law_1.01,0.08536959886550903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,16,1,power_law_1.2,0.08510720133781433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,16,1,power_law_1.2,0.08543360233306885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,2,1,balanced,0.24764800071716309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,2,1,balanced,0.2497653365135193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,2,1,power_law_1.01,0.23183999061584473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,2,1,power_law_1.01,0.2386687994003296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,2,1,power_law_1.2,0.2399679899215698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,2,1,power_law_1.2,0.24030721187591553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,32,1,balanced,0.07396266857783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,32,1,balanced,0.07425599793593089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,32,1,power_law_1.01,0.06951680183410644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,32,1,power_law_1.01,0.07090560197830201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,32,1,power_law_1.2,0.0707647979259491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,32,1,power_law_1.2,0.07200639843940734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,4,1,balanced,0.16567466656366983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,4,1,balanced,0.168122669061025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,4,1,power_law_1.01,0.1538879990577698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,4,1,power_law_1.01,0.1544319987297058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,4,1,power_law_1.2,0.15555839538574218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,4,1,power_law_1.2,0.15691519975662233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,8,1,balanced,0.11029866337776184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,8,1,balanced,0.11156800389289856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,8,1,power_law_1.01,0.10531200170516967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,8,1,power_law_1.01,0.10546560287475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,8,1,power_law_1.2,0.1071679949760437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,1536,8,128,8,1,power_law_1.2,0.10717439651489258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,1,balanced,2.890666643778483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,1,balanced,2.924234708150228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,1,power_law_1.01,2.4132863998413088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,1,power_law_1.01,2.428940773010254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,1,power_law_1.2,2.3686592102050783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,1,power_law_1.2,2.5115711212158205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,128,balanced,0.10272000233332317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,128,balanced,0.10321600238482158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,128,power_law_1.01,0.09819520115852357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,128,power_law_1.01,0.09996160268783569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,128,power_law_1.2,0.10109440088272095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,128,power_law_1.2,0.10160640478134156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,16,balanced,0.25677865743637085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,16,balanced,0.258245329062144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,16,power_law_1.01,0.23247361183166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,16,power_law_1.01,0.24035201072692872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,16,power_law_1.2,0.2369920015335083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,16,power_law_1.2,0.2452608108520508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,2,balanced,1.4400053024291992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,2,balanced,1.4449386596679688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,2,power_law_1.01,1.2595135688781738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,2,power_law_1.01,1.2716352462768554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,2,power_law_1.2,1.2335871696472167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,2,power_law_1.2,1.24900484085083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,256,balanced,0.08881066242853801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,256,balanced,0.08956266442934673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,256,power_law_1.01,0.0867904007434845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,256,power_law_1.01,0.08704000115394592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,256,power_law_1.2,0.08648959994316101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,256,power_law_1.2,0.08726400136947632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,32,balanced,0.17463467518488565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,32,balanced,0.17629865805308023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,32,power_law_1.01,0.15327999591827393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,32,power_law_1.01,0.1625856041908264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,32,power_law_1.2,0.15684479475021362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,32,power_law_1.2,0.16124160289764405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,4,balanced,0.7624320189158121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,4,balanced,0.7660906314849854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,4,power_law_1.01,0.6639232158660888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,4,power_law_1.01,0.6844223976135254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,4,power_law_1.2,0.6747647762298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,4,power_law_1.2,0.7044608116149902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,64,balanced,0.12172266840934753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,64,balanced,0.12298132975896199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,64,power_law_1.01,0.1174015998840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,64,power_law_1.01,0.11924480199813843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,64,power_law_1.2,0.11292159557342529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,64,power_law_1.2,0.11656320095062256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,8,balanced,0.42691198984781903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,8,balanced,0.4280480146408081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,8,power_law_1.01,0.3642688035964966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,8,power_law_1.01,0.37343358993530273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,8,power_law_1.2,0.3710079908370972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,1,8,power_law_1.2,0.392742395401001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,16,1,balanced,7.558245340983073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,16,1,balanced,7.5621388753255205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,16,1,power_law_1.01,6.446009826660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,16,1,power_law_1.01,6.467929840087891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,16,1,power_law_1.2,6.381651306152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,16,1,power_law_1.2,6.532768249511719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,2,1,balanced,1.4507946968078613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,2,1,balanced,1.5421333312988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,2,1,power_law_1.01,1.2532735824584962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,2,1,power_law_1.01,1.2542079925537108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,2,1,power_law_1.2,1.2388416290283204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,2,1,power_law_1.2,1.260960006713867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,32,1,balanced,4.521253267923991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,32,1,balanced,4.52125867207845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,32,1,power_law_1.01,3.8564990997314452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,32,1,power_law_1.01,3.8826881408691407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,32,1,power_law_1.2,3.834272003173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,32,1,power_law_1.2,3.8539966583251952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,4,1,balanced,0.8120160102844238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,4,1,balanced,0.8139359951019287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,4,1,power_law_1.01,0.7069952011108398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,4,1,power_law_1.01,0.7100224018096923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,4,1,power_law_1.2,0.6943615913391114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,4,1,power_law_1.2,0.6998591899871827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,8,1,balanced,0.48369065920511883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,8,1,balanced,0.49772266546885174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,8,1,power_law_1.01,0.4193215847015381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,8,1,power_law_1.01,0.4201663970947266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,8,1,power_law_1.2,0.4159679889678955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,4096,2688,22,512,8,1,power_law_1.2,0.421235179901123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,1,balanced,0.5170453389485677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,1,balanced,0.5197759866714478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,1,power_law_1.01,0.5956736087799073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,1,power_law_1.01,0.617683219909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,1,power_law_1.2,0.5941120147705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,1,power_law_1.2,0.6093120098114013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,2,balanced,0.3012853264808655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,2,balanced,0.301418662071228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,2,power_law_1.01,0.3911679983139038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,2,power_law_1.01,0.4039167881011963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,2,power_law_1.2,0.4078656196594238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,2,power_law_1.2,0.4169792175292969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,4,balanced,0.20906132459640503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,4,balanced,0.21357866128285727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,4,power_law_1.01,0.2691263914108276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,4,power_law_1.01,0.28365440368652345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,4,power_law_1.2,0.2695359945297241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,4,power_law_1.2,0.2787584066390991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,8,balanced,0.18095467487970987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,8,balanced,0.18447466691335043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,8,power_law_1.01,0.21967360973358155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,8,power_law_1.01,0.23872001171112062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,8,power_law_1.2,0.2381887912750244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,1,8,power_law_1.2,0.2511552095413208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,16,1,balanced,0.0804799993832906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,16,1,balanced,0.08180800080299377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,16,1,power_law_1.01,0.08380159735679626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,16,1,power_law_1.01,0.08447359800338745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,16,1,power_law_1.2,0.0849407970905304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,16,1,power_law_1.2,0.08515840172767639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,2,1,balanced,0.2800640066464742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,2,1,balanced,0.28252800305684406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,2,1,power_law_1.01,0.3104703903198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,2,1,power_law_1.01,0.3204927921295166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,2,1,power_law_1.2,0.3105151891708374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,2,1,power_law_1.2,0.3170752048492432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,32,1,balanced,0.05794133245944977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,32,1,balanced,0.058058664202690125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,32,1,power_law_1.01,0.061766397953033444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,32,1,power_law_1.01,0.06276479959487916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,32,1,power_law_1.2,0.061452800035476686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,32,1,power_law_1.2,0.06202239990234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,4,1,balanced,0.16123732924461365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,4,1,balanced,0.16249066591262817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,4,1,power_law_1.01,0.17937920093536378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,4,1,power_law_1.01,0.1794368028640747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,4,1,power_law_1.2,0.17734400033950806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,4,1,power_law_1.2,0.1805184006690979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,8,1,balanced,0.12984533111254373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,8,1,balanced,0.12989866733551025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,8,1,power_law_1.01,0.1146239995956421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,8,1,power_law_1.01,0.11496959924697876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,8,1,power_law_1.2,0.11566720008850098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,16384,2,8,8,1,power_law_1.2,0.1159168004989624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,1,balanced,1.6412426630655925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,1,balanced,1.7049546241760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,1,power_law_1.01,1.3438143730163574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,1,power_law_1.01,1.347231960296631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,1,power_law_1.2,1.279423999786377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,1,power_law_1.2,1.3093759536743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,128,balanced,0.07217066486676534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,128,balanced,0.07281066477298737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,128,power_law_1.01,0.07131519913673401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,128,power_law_1.01,0.07205119729042053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,128,power_law_1.2,0.07190399765968322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,128,power_law_1.2,0.07285760045051574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,16,balanced,0.1590559979279836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,16,balanced,0.15965333580970764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,16,power_law_1.01,0.15482879877090455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,16,power_law_1.01,0.15560959577560424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,16,power_law_1.2,0.14232959747314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,16,power_law_1.2,0.15394560098648072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,2,balanced,0.8582986990610758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,2,balanced,0.8612213134765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,2,power_law_1.01,0.7157440185546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,2,power_law_1.01,0.7354368209838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,2,power_law_1.2,0.7125184059143066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,2,power_law_1.2,0.7155263900756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,256,balanced,0.06453333298365276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,256,balanced,0.06462400158246358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,256,power_law_1.01,0.0641215980052948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,256,power_law_1.01,0.06469759941101075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,256,power_law_1.2,0.06353920102119445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,256,power_law_1.2,0.06485120058059693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,32,balanced,0.12272000312805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,32,balanced,0.12470933794975281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,32,power_law_1.01,0.10515199899673462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,32,power_law_1.01,0.11327359676361085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,32,power_law_1.2,0.11313920021057129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,32,power_law_1.2,0.11383039951324463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,4,balanced,0.4608000119527181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,4,balanced,0.46855998039245605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,4,power_law_1.01,0.3963007926940918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,4,power_law_1.01,0.43169918060302737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,4,power_law_1.2,0.3985663890838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,4,power_law_1.2,0.43245439529418944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,64,balanced,0.09436266620953877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,64,balanced,0.09498133261998494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,64,power_law_1.01,0.09146239757537841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,64,power_law_1.01,0.09192960262298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,64,power_law_1.2,0.08596479892730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,64,power_law_1.2,0.09132800102233887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,8,balanced,0.26314665873845416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,8,balanced,0.2653440038363139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,8,power_law_1.01,0.23617279529571533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,8,power_law_1.01,0.25647358894348143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,8,power_law_1.2,0.23147521018981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,1,8,power_law_1.2,0.23605759143829347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,16,1,balanced,0.19514133532842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,16,1,balanced,0.19599467515945435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,16,1,power_law_1.01,0.16673920154571534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,16,1,power_law_1.01,0.16943360567092897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,16,1,power_law_1.2,0.1655295968055725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,16,1,power_law_1.2,0.16873600482940673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,2,1,balanced,0.8572266896565756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,2,1,balanced,0.8590719699859619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,2,1,power_law_1.01,0.6924352169036865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,2,1,power_law_1.01,0.7058944225311279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,2,1,power_law_1.2,0.6820991992950439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,2,1,power_law_1.2,0.702016019821167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,32,1,balanced,0.1623360017935435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,32,1,balanced,0.16267200311024985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,32,1,power_law_1.01,0.1425920009613037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,32,1,power_law_1.01,0.14263039827346802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,32,1,power_law_1.2,0.14250880479812622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,32,1,power_law_1.2,0.14264320135116576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,4,1,balanced,0.48227731386820477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,4,1,balanced,0.4830079873402913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,4,1,power_law_1.01,0.38243200778961184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,4,1,power_law_1.01,0.38558719158172605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,4,1,power_law_1.2,0.3778687953948975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,4,1,power_law_1.2,0.38439040184020995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,8,1,balanced,0.2943466703097026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,8,1,balanced,0.2956106662750244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,8,1,power_law_1.01,0.2540607929229736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,8,1,power_law_1.01,0.2563904047012329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,8,1,power_law_1.2,0.25217280387878416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2048,8,256,8,1,power_law_1.2,0.255679988861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,1,balanced,1.3176266352335613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,1,balanced,1.3472533226013184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,1,power_law_1.01,1.1546048164367675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,1,power_law_1.01,1.1703104019165038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,1,power_law_1.2,1.156275177001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,1,power_law_1.2,1.1607616424560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,16,balanced,0.14895466963450113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,16,balanced,0.14945600430170694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,16,power_law_1.01,0.1325055956840515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,16,power_law_1.01,0.14632960557937622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,16,power_law_1.2,0.1326143980026245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,16,power_law_1.2,0.14446719884872436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,2,balanced,0.6885333061218262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,2,balanced,0.6887146631876627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,2,power_law_1.01,0.6075136184692382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,2,power_law_1.01,0.6113791942596436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,2,power_law_1.2,0.6063488006591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,2,power_law_1.2,0.6246592044830322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,32,balanced,0.10564266641934712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,32,balanced,0.10734400153160095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,32,power_law_1.01,0.10373120307922364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,32,power_law_1.01,0.10607359409332276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,32,power_law_1.2,0.10231679677963257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,32,power_law_1.2,0.1053056001663208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,4,balanced,0.37538135051727295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,4,balanced,0.3779253164927165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,4,power_law_1.01,0.34767999649047854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,4,power_law_1.01,0.35111041069030763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,4,power_law_1.2,0.3339967966079712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,4,power_law_1.2,0.3489023923873901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,8,balanced,0.22819199164708456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,8,balanced,0.23558932542800903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,8,power_law_1.01,0.21701760292053224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,8,power_law_1.01,0.22238080501556395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,8,power_law_1.2,0.21824638843536376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,1,8,power_law_1.2,0.2186880111694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,16,1,balanced,0.17930134137471518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,16,1,balanced,0.17976532379786173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,16,1,power_law_1.01,0.16762239933013917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,16,1,power_law_1.01,0.16822400093078613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,16,1,power_law_1.2,0.1686336040496826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,16,1,power_law_1.2,0.16874239444732667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,2,1,balanced,0.675269365310669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,2,1,balanced,0.6829546292622884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,2,1,power_law_1.01,0.6024447917938233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,2,1,power_law_1.01,0.6133952140808105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,2,1,power_law_1.2,0.606009578704834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,2,1,power_law_1.2,0.6171840190887451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,32,1,balanced,0.1450506647427877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,32,1,balanced,0.14549866318702698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,32,1,power_law_1.01,0.1338047981262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,32,1,power_law_1.01,0.1371392011642456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,32,1,power_law_1.2,0.13470079898834228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,32,1,power_law_1.2,0.13784960508346558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,4,1,balanced,0.37328000863393146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,4,1,balanced,0.3803040186564128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,4,1,power_law_1.01,0.3405632019042969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,4,1,power_law_1.01,0.34603519439697267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,4,1,power_law_1.2,0.347654390335083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,4,1,power_law_1.2,0.35622398853302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,8,1,balanced,0.25413866837819415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,8,1,balanced,0.25539199511210126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,8,1,power_law_1.01,0.22593278884887696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,8,1,power_law_1.01,0.2306368112564087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,8,1,power_law_1.2,0.23109118938446044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,6144,2560,8,160,8,1,power_law_1.2,0.23316481113433837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,1,balanced,1.9183200200398762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,1,balanced,1.924181302388509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,1,power_law_1.01,1.5194496154785155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,1,power_law_1.01,1.532915210723877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,1,power_law_1.2,1.508364772796631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,1,power_law_1.2,1.5191616058349608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,128,balanced,0.08669333656628926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,128,balanced,0.08842133482297261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,128,power_law_1.01,0.08648319840431214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,128,power_law_1.01,0.08679680228233337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,128,power_law_1.2,0.08561919927597046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,128,power_law_1.2,0.08675199747085571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,16,balanced,0.1800373395284017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,16,balanced,0.18232532342274985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,16,power_law_1.01,0.17637759447097778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,16,power_law_1.01,0.17646080255508423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,16,power_law_1.2,0.17325439453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,16,power_law_1.2,0.17434879541397094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,2,balanced,0.9991146723429362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,2,balanced,1.002229372660319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,2,power_law_1.01,0.8052543640136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,2,power_law_1.01,0.8633791923522949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,2,power_law_1.2,0.8323712348937988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,2,power_law_1.2,0.8484864234924316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,256,balanced,0.07281599938869476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,256,balanced,0.07285866638024648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,256,power_law_1.01,0.07049599885940552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,256,power_law_1.01,0.07193599939346314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,256,power_law_1.2,0.07249919772148132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,256,power_law_1.2,0.07256960272789001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,32,balanced,0.1378933290640513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,32,balanced,0.13798933227856955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,32,power_law_1.01,0.11783679723739623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,32,power_law_1.01,0.12842240333557128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,32,power_law_1.2,0.10998400449752807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,32,power_law_1.2,0.12722560167312622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,4,balanced,0.542853315671285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,4,balanced,0.5704906781514486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,4,power_law_1.01,0.4434688091278076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,4,power_law_1.01,0.44606719017028806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,4,power_law_1.2,0.4662975788116455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,4,power_law_1.2,0.4742271900177002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,64,balanced,0.10161599516868591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,64,balanced,0.10433600346247356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,64,power_law_1.01,0.09966080188751221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,64,power_law_1.01,0.10327039957046509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,64,power_law_1.2,0.09414399862289428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,64,power_law_1.2,0.10119040012359619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,8,balanced,0.3001439968744914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,8,balanced,0.3043946623802185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,8,power_law_1.01,0.2782912015914917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,8,power_law_1.01,0.2790015935897827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,8,power_law_1.2,0.2725503921508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,1,8,power_law_1.2,0.29075839519500735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,16,1,balanced,0.22293333212534586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,16,1,balanced,0.22501866022745767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,16,1,power_law_1.01,0.19330559968948363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,16,1,power_law_1.01,0.20176639556884765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,16,1,power_law_1.2,0.19457279443740844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,16,1,power_law_1.2,0.19785599708557128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,2,1,balanced,1.0112053553263347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,2,1,balanced,1.0214080015818279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,2,1,power_law_1.01,0.8042304039001464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,2,1,power_law_1.01,0.8205696105957031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,2,1,power_law_1.2,0.7987648010253906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,2,1,power_law_1.2,0.8066623687744141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,32,1,balanced,0.18500266472498575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,32,1,balanced,0.18588266770044962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,32,1,power_law_1.01,0.16227840185165404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,32,1,power_law_1.01,0.16324479579925538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,32,1,power_law_1.2,0.16001280546188354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,32,1,power_law_1.2,0.16193920373916626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,4,1,balanced,0.5522773265838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,4,1,balanced,0.5600053469340006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,4,1,power_law_1.01,0.4485504150390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,4,1,power_law_1.01,0.4548031806945801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,4,1,power_law_1.2,0.4521471977233887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,4,1,power_law_1.2,0.45765118598937987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,8,1,balanced,0.34146666526794434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,8,1,balanced,0.34346667925516766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,8,1,power_law_1.01,0.29323520660400393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,8,1,power_law_1.01,0.2940864086151123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,8,1,power_law_1.2,0.2931519985198975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,256,8,1,power_law_1.2,0.2935359954833984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,1,balanced,2.984858512878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,1,balanced,3.0507787068684897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,1,power_law_1.01,2.0398591995239257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,1,power_law_1.01,2.0585344314575194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,1,power_law_1.2,1.9714111328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,1,power_law_1.2,2.0490175247192384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,128,balanced,0.09641066193580627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,128,balanced,0.09672533472379048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,128,power_law_1.01,0.0948095977306366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,128,power_law_1.01,0.09527680277824402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,128,power_law_1.2,0.09336959719657897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,128,power_law_1.2,0.09448959827423095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,16,balanced,0.2526613275210063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,16,balanced,0.25331199169158936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,16,power_law_1.01,0.20779519081115722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,16,power_law_1.01,0.221612811088562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,16,power_law_1.2,0.19367680549621583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,16,power_law_1.2,0.21902079582214357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,2,balanced,1.4814133644104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,2,balanced,1.5087839762369792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,2,power_law_1.01,1.122777557373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,2,power_law_1.01,1.1363264083862306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,2,power_law_1.2,1.0008319854736327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,2,power_law_1.2,1.0865792274475097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,32,balanced,0.17291200160980225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,32,balanced,0.17457065979639688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,32,power_law_1.01,0.14585599899291993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,32,power_law_1.01,0.15105279684066772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,32,power_law_1.2,0.1443392038345337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,32,power_law_1.2,0.14483840465545655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,4,balanced,0.775386651357015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,4,balanced,0.7756960391998291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,4,power_law_1.01,0.5804287910461425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,4,power_law_1.01,0.6171199798583984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,4,power_law_1.2,0.6166336059570312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,4,power_law_1.2,0.665772819519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,64,balanced,0.11440533399581909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,64,balanced,0.11623467008272807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,64,power_law_1.01,0.11055999994277954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,64,power_law_1.01,0.11088000535964966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,64,power_law_1.2,0.11070719957351685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,64,power_law_1.2,0.11382399797439575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,8,balanced,0.4213493267695109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,8,balanced,0.42258667945861816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,8,power_law_1.01,0.3723135948181152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,8,power_law_1.01,0.38901119232177733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,8,power_law_1.2,0.34714879989624026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,1,8,power_law_1.2,0.398854398727417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,16,1,balanced,0.3224053382873535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,16,1,balanced,0.32764265934626263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,16,1,power_law_1.01,0.23417599201202394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,16,1,power_law_1.01,0.23491199016571046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,16,1,power_law_1.2,0.2326335906982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,16,1,power_law_1.2,0.23338239192962645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,2,1,balanced,1.4669334093729656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,2,1,balanced,1.4751893679300945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,2,1,power_law_1.01,1.0599231719970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,2,1,power_law_1.01,1.0779775619506835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,2,1,power_law_1.2,1.033561611175537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,2,1,power_law_1.2,1.0408703804016113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,32,1,balanced,0.2526400089263916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,32,1,balanced,0.25339200099309284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,32,1,power_law_1.01,0.20182399749755858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,32,1,power_law_1.01,0.20454399585723876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,32,1,power_law_1.2,0.19159679412841796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,32,1,power_law_1.2,0.19368319511413573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,4,1,balanced,0.8018666903177897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,4,1,balanced,0.810149351755778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,4,1,power_law_1.01,0.5940927982330322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,4,1,power_law_1.01,0.6022784233093261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,4,1,power_law_1.2,0.5716351985931396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,4,1,power_law_1.2,0.5771647930145264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,8,1,balanced,0.47782401243845624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,8,1,balanced,0.47886931896209717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,8,1,power_law_1.01,0.35519359111785886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,8,1,power_law_1.01,0.35727360248565676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,8,1,power_law_1.2,0.35203840732574465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8,96,7168,2048,8,384,8,1,power_law_1.2,0.35389440059661864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,1,balanced,0.03137599925200144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,1,balanced,0.03161599983771642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,1,power_law_1.01,0.030028799176216127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,1,power_law_1.01,0.03027839958667755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,1,power_law_1.2,0.030086401104927062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,1,power_law_1.2,0.030937600135803222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,128,balanced,0.03753600021203359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,128,balanced,0.03758399933576584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,128,power_law_1.01,0.034227201342582704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,128,power_law_1.01,0.03592320084571839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,128,power_law_1.2,0.03455359935760498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,128,power_law_1.2,0.035104000568389894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,16,balanced,0.03537066777547201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,16,balanced,0.03570133447647095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,16,power_law_1.01,0.03529599905014038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,16,power_law_1.01,0.03534719944000244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,16,power_law_1.2,0.03511680066585541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,16,power_law_1.2,0.03535360097885132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,2,balanced,0.03559466699759165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,2,balanced,0.0377866675456365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,2,power_law_1.01,0.0353408008813858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,2,power_law_1.01,0.035795199871063235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,2,power_law_1.2,0.035488000512123107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,2,power_law_1.2,0.03656319975852966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,32,balanced,0.035573333501815796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,32,balanced,0.03585066646337509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,32,power_law_1.01,0.03470720052719116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,32,power_law_1.01,0.03621760010719299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,32,power_law_1.2,0.03495680093765259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,32,power_law_1.2,0.035743999481201175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,4,balanced,0.04179200033346812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,4,balanced,0.043824002146720886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,4,power_law_1.01,0.0354559987783432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,4,power_law_1.01,0.03575679957866669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,4,power_law_1.2,0.035411199927330016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,4,power_law_1.2,0.03553920090198517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,64,balanced,0.03565333286921183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,64,balanced,0.03579733272393545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,64,power_law_1.01,0.03399679958820343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,64,power_law_1.01,0.03550719916820526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,64,power_law_1.2,0.03484799861907959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,64,power_law_1.2,0.035846400260925296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,8,balanced,0.0356480007370313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,8,balanced,0.03736000011364619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,8,power_law_1.01,0.0347135990858078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,8,power_law_1.01,0.035699200630187986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,8,power_law_1.2,0.03524479866027832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,1,8,power_law_1.2,0.03573760092258453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,2,1,balanced,0.02959999938805898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,2,1,balanced,0.029994666576385498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,2,1,power_law_1.01,0.028281599283218384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,2,1,power_law_1.01,0.028288000822067262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,2,1,power_law_1.2,0.027910399436950683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,2048,768,8,128,2,1,power_law_1.2,0.02800000011920929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,1,balanced,0.05392533540725708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,1,balanced,0.05537599821885427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,1,power_law_1.01,0.052825599908828735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,1,power_law_1.01,0.05363199710845947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,1,power_law_1.2,0.05359359979629517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,1,power_law_1.2,0.05392640233039856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,128,balanced,0.041749333341916404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,128,balanced,0.04264533519744873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,128,power_law_1.01,0.040345600247383116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,128,power_law_1.01,0.04217599928379059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,128,power_law_1.2,0.04066559970378876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,128,power_law_1.2,0.04140160083770752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,16,balanced,0.041738669077555336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,16,balanced,0.04180799921353658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,16,power_law_1.01,0.05914239883422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,16,power_law_1.01,0.05945600271224975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,16,power_law_1.2,0.057062399387359616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,16,power_law_1.2,0.0590719997882843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,2,balanced,0.04385066529115041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,2,balanced,0.05192000170548757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,2,power_law_1.01,0.057580798864364624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,2,power_law_1.01,0.05975679755210876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,2,power_law_1.2,0.05917440056800842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,2,power_law_1.2,0.05975040197372437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,256,balanced,0.04364799956480662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,256,balanced,0.043706665436426796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,256,power_law_1.01,0.04169600009918213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,256,power_law_1.01,0.04175359904766083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,256,power_law_1.2,0.041868799924850465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,256,power_law_1.2,0.04220159947872162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,32,balanced,0.04179200033346812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,32,balanced,0.041893333196640015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,32,power_law_1.01,0.05754240155220032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,32,power_law_1.01,0.05857279896736145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,32,power_law_1.2,0.057894402742385866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,32,power_law_1.2,0.05896959900856018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,4,balanced,0.04364266494909922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,4,balanced,0.043791999419530235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,4,power_law_1.01,0.0576960027217865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,4,power_law_1.01,0.05896959900856018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,4,power_law_1.2,0.056729602813720706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,4,power_law_1.2,0.05944960117340088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,64,balanced,0.04171733558177948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,64,balanced,0.04179200033346812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,64,power_law_1.01,0.04184960126876831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,64,power_law_1.01,0.044531199336051944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,64,power_law_1.2,0.04345600008964538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,64,power_law_1.2,0.04350079894065857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,8,balanced,0.043477331598599754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,8,balanced,0.04562133550643921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,8,power_law_1.01,0.05928320288658142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,8,power_law_1.01,0.059648001194000246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,8,power_law_1.2,0.05813760161399841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,1,8,power_law_1.2,0.05880320072174072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,2,1,balanced,0.04173333446184794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,2,1,balanced,0.04174399872620901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,2,1,power_law_1.01,0.03590399920940399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,2,1,power_law_1.01,0.036595198512077334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,2,1,power_law_1.2,0.03472639918327332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,2,1,power_law_1.2,0.03493120074272156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,4,1,balanced,0.03365866591533025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,4,1,balanced,0.033759998778502144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,4,1,power_law_1.01,0.03192319869995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,4,1,power_law_1.01,0.032416000962257385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,4,1,power_law_1.2,0.032492798566818235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,3072,1536,8,256,4,1,power_law_1.2,0.03253119885921478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,1,balanced,0.13530133167902628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,1,balanced,0.1360106666882833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,1,power_law_1.01,0.13388160467147828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,1,power_law_1.01,0.1353600025177002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,1,power_law_1.2,0.13501440286636351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,1,power_law_1.2,0.1369279980659485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,2,balanced,0.13377066453297934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,2,balanced,0.1448319951693217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,2,power_law_1.01,0.1318400025367737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,2,power_law_1.01,0.1396607995033264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,2,power_law_1.2,0.12821760177612304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,2,power_law_1.2,0.13645440340042114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,4,balanced,0.12710400422414145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,4,balanced,0.1295146644115448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,4,power_law_1.01,0.12534400224685668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,4,power_law_1.01,0.12549760341644287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,4,power_law_1.2,0.13647359609603882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,4,power_law_1.2,0.15551359653472902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,8,balanced,0.126991997162501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,8,balanced,0.12774399916330972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,8,power_law_1.01,0.12606719732284546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,8,power_law_1.01,0.12613760232925414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,8,power_law_1.2,0.1261504054069519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,1,8,power_law_1.2,0.12679040431976318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,16,1,balanced,0.03755733370780945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,16,1,balanced,0.037690666814645134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,16,1,power_law_1.01,0.03531520068645477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,16,1,power_law_1.01,0.0356799989938736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,16,1,power_law_1.2,0.04010240137577057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,16,1,power_law_1.2,0.04403199851512909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,2,1,balanced,0.08437866965929668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,2,1,balanced,0.09949866930643718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,2,1,power_law_1.01,0.0831488013267517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,2,1,power_law_1.01,0.08442879915237426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,2,1,power_law_1.2,0.0837823987007141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,2,1,power_law_1.2,0.09548799991607666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,4,1,balanced,0.06112533311049143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,4,1,balanced,0.06433066725730896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,4,1,power_law_1.01,0.06193280220031738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,4,1,power_law_1.01,0.06912639737129211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,4,1,power_law_1.2,0.05914880037307739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,4,1,power_law_1.2,0.0593280017375946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,8,1,balanced,0.04170133173465729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,8,1,balanced,0.04172799984614054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,8,1,power_law_1.01,0.04672000110149384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,8,1,power_law_1.01,0.04785279929637909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,8,1,power_law_1.2,0.04583680033683777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,14336,2,8,8,1,power_law_1.2,0.05467519760131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,1,balanced,0.06140799820423126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,1,balanced,0.06191466748714447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,1,power_law_1.01,0.05923839807510376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,1,power_law_1.01,0.060115200281143186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,1,power_law_1.2,0.059628802537918094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,1,power_law_1.2,0.05979520082473755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,128,balanced,0.04570133487383524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,128,balanced,0.04600533346335093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,128,power_law_1.01,0.044863998889923096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,128,power_law_1.01,0.04519039988517761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,128,power_law_1.2,0.0451200008392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,128,power_law_1.2,0.045363199710845944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,16,balanced,0.04553600152333578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,16,balanced,0.046165332198143005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,16,power_law_1.01,0.06484479904174804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,16,power_law_1.01,0.06714879870414733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,16,power_law_1.2,0.06540160179138184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,16,power_law_1.2,0.06552960276603699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,2,balanced,0.051669334371884666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,2,balanced,0.05599466462930044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,2,power_law_1.01,0.06503040194511414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,2,power_law_1.01,0.06547200083732604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,2,power_law_1.2,0.06433280110359192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,2,power_law_1.2,0.06666880249977111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,32,balanced,0.04584000011285146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,32,balanced,0.04771733283996582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,32,power_law_1.01,0.0490880012512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,32,power_law_1.01,0.053260797262191774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,32,power_law_1.2,0.04987519979476929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,32,power_law_1.2,0.054816001653671266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,4,balanced,0.045909335215886436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,4,balanced,0.045935998360315956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,4,power_law_1.01,0.06499840021133423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,4,power_law_1.01,0.06614400148391723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,4,power_law_1.2,0.06474879980087281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,4,power_law_1.2,0.06611199975013733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,64,balanced,0.04587733248869578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,64,power_law_1.01,0.04493440091609955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,64,power_law_1.01,0.044940799474716187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,64,power_law_1.2,0.044844800233840944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,64,power_law_1.2,0.04519680142402649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,8,balanced,0.04577599962552389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,8,balanced,0.046069333950678505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,8,power_law_1.01,0.06517120003700257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,8,power_law_1.01,0.06567040085792542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,8,power_law_1.2,0.06395519971847534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,1,8,power_law_1.2,0.0658240020275116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,2,1,balanced,0.04372799893220266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,2,1,balanced,0.04539200166861216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,2,1,power_law_1.01,0.04242559969425201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,2,1,power_law_1.01,0.04247680008411407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,2,1,power_law_1.2,0.041433599591255185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,2,1,power_law_1.2,0.043993601202964784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,4,1,balanced,0.037690666814645134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,4,1,balanced,0.0377866675456365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,4,1,power_law_1.01,0.03596799969673157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,4,1,power_law_1.01,0.036883199214935304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,4,1,power_law_1.2,0.0359935998916626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,1536,8,128,4,1,power_law_1.2,0.03644160032272339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,1,balanced,0.1646453340848287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,1,balanced,0.16713599363962808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,1,power_law_1.01,0.16213760375976563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,1,power_law_1.01,0.16455680131912231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,1,power_law_1.2,0.16216959953308105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,1,power_law_1.2,0.16320639848709106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,128,balanced,0.05173333485921224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,128,balanced,0.052042668064435325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,128,power_law_1.01,0.07227519750595093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,128,power_law_1.01,0.07301759719848633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,128,power_law_1.2,0.07132160067558288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,128,power_law_1.2,0.07214080095291138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,16,balanced,0.05650666852792104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,16,balanced,0.06362133224805196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,16,power_law_1.01,0.168230402469635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,16,power_law_1.01,0.16844799518585205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,16,power_law_1.2,0.16751999855041505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,16,power_law_1.2,0.16788480281829835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,2,balanced,0.10079999764760335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,2,balanced,0.10383466879526775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,2,power_law_1.01,0.16761599779129027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,2,power_law_1.01,0.169977605342865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,2,power_law_1.2,0.16885759830474853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,2,power_law_1.2,0.1689919948577881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,256,balanced,0.0517439991235733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,256,balanced,0.052000001072883606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,256,power_law_1.01,0.05390080213546753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,256,power_law_1.01,0.05610880255699158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,256,power_law_1.2,0.056492799520492555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,256,power_law_1.2,0.05785599946975708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,32,balanced,0.05205333232879639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,32,balanced,0.05213333169619242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,32,power_law_1.01,0.13704960346221923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,32,power_law_1.01,0.1390720009803772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,32,power_law_1.2,0.13602559566497802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,32,power_law_1.2,0.13642879724502563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,4,balanced,0.07869333525498708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,4,balanced,0.08113066852092743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,4,power_law_1.01,0.1696768045425415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,4,power_law_1.01,0.16969599723815917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,4,power_law_1.2,0.16792960166931153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,4,power_law_1.2,0.16830079555511473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,64,balanced,0.051728000243504844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,64,balanced,0.05193600058555603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,64,power_law_1.01,0.08702719807624817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,64,power_law_1.01,0.0880128026008606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,64,power_law_1.2,0.08567039966583252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,64,power_law_1.2,0.08791040182113648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,8,balanced,0.07625066737333934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,8,balanced,0.07735466460386912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,8,power_law_1.01,0.16677759885787963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,8,power_law_1.01,0.16909439563751222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,8,power_law_1.2,0.16728960275650023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,4096,2688,22,512,1,8,power_law_1.2,0.16805119514465333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,1,balanced,0.17901867628097534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,1,balanced,0.180074671904246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,1,power_law_1.01,0.17729920148849487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,1,power_law_1.01,0.17738239765167235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,1,power_law_1.2,0.1767040014266968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,1,power_law_1.2,0.176800000667572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,2,balanced,0.18635733922322592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,2,balanced,0.1899999976158142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,2,power_law_1.01,0.16230399608612062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,2,power_law_1.01,0.2173248052597046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,2,power_law_1.2,0.16769920587539672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,2,power_law_1.2,0.17801599502563475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,4,balanced,0.15986133615175882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,4,balanced,0.16309866309165955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,4,power_law_1.01,0.15674879550933837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,4,power_law_1.01,0.16637439727783204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,4,power_law_1.2,0.15670399665832518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,4,power_law_1.2,0.16353919506072997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,8,balanced,0.15891200304031372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,8,balanced,0.15948800245920816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,8,power_law_1.01,0.1561344027519226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,8,power_law_1.01,0.15627520084381102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,8,power_law_1.2,0.1554751992225647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,1,8,power_law_1.2,0.18568320274353028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,16,1,balanced,0.043840001026789345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,16,1,balanced,0.04580266773700714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,16,1,power_law_1.01,0.04989440143108368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,16,1,power_law_1.01,0.05137280225753784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,16,1,power_law_1.2,0.05294079780578613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,16,1,power_law_1.2,0.05304960012435913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,2,1,balanced,0.10937066872914632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,2,1,balanced,0.11544000109036763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,2,1,power_law_1.01,0.10599039793014527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,2,1,power_law_1.01,0.10959359407424926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,2,1,power_law_1.2,0.10661120414733886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,2,1,power_law_1.2,0.11281919479370117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,32,1,balanced,0.0436160018046697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,32,1,balanced,0.043749332427978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,32,1,power_law_1.01,0.042854401469230655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,32,1,power_law_1.01,0.04408960044384003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,32,1,power_law_1.2,0.04362240135669708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,32,1,power_law_1.2,0.04364160001277924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,4,1,balanced,0.07694399853547414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,4,1,balanced,0.09122666716575623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,4,1,power_law_1.01,0.07404800057411194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,4,1,power_law_1.01,0.074099200963974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,4,1,power_law_1.2,0.0742143988609314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,4,1,power_law_1.2,0.08511360287666321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,8,1,balanced,0.058789332707722984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,8,1,balanced,0.06233599781990051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,8,1,power_law_1.01,0.06865280270576476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,8,1,power_law_1.01,0.07008000016212464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,8,1,power_law_1.2,0.06087039709091187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,16384,2,8,8,1,power_law_1.2,0.061401599645614625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,1,balanced,0.0864586631457011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,1,balanced,0.08660266796747844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,1,power_law_1.01,0.08446720242500305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,1,power_law_1.01,0.08569599986076355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,1,power_law_1.2,0.08460800051689148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,1,power_law_1.2,0.08603519797325135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,128,balanced,0.05409599840641022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,128,balanced,0.05595199763774872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,128,power_law_1.01,0.06020479798316956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,128,power_law_1.01,0.06590080261230469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,128,power_law_1.2,0.05868800282478333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,128,power_law_1.2,0.061990398168563846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,16,balanced,0.056090667843818665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,16,balanced,0.05716800192991892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,16,power_law_1.01,0.08899199962615967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,16,power_law_1.01,0.08990079760551453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,16,power_law_1.2,0.08977919816970825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,16,power_law_1.2,0.09085440039634704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,2,balanced,0.07599466542402904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,2,balanced,0.07640000184377034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,2,power_law_1.01,0.08986240029335021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,2,power_law_1.01,0.0898688018321991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,2,power_law_1.2,0.08929280042648316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,2,power_law_1.2,0.09096320271492005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,256,balanced,0.05500266452630361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,256,balanced,0.05606399973233541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,256,power_law_1.01,0.05297920107841492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,256,power_law_1.01,0.05446400046348572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,256,power_law_1.2,0.053286397457122804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,256,power_law_1.2,0.055238401889801024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,32,balanced,0.05592533449331919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,32,balanced,0.056218668818473816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,32,power_law_1.01,0.09157119989395142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,32,power_law_1.01,0.09274880290031433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,32,power_law_1.2,0.08931840062141419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,32,power_law_1.2,0.09038720130920411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,4,balanced,0.06030400097370148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,4,balanced,0.0620959997177124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,4,power_law_1.01,0.09091839790344239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,4,power_law_1.01,0.09118720293045043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,4,power_law_1.2,0.09007999897003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,4,power_law_1.2,0.09035519957542419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,64,balanced,0.0539680023988088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,64,balanced,0.05630399783452352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,64,power_law_1.01,0.07414399981498718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,64,power_law_1.01,0.07428479790687562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,64,power_law_1.2,0.07395200133323669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,64,power_law_1.2,0.07519999742507935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,8,balanced,0.05413866539796194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,8,balanced,0.06011199951171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,8,power_law_1.01,0.08556159734725952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,8,power_law_1.01,0.08701440095901489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,8,power_law_1.2,0.08659840226173401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,1,8,power_law_1.2,0.0871295988559723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,16,1,balanced,0.04386133452256521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,16,1,balanced,0.04409599800904592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,16,1,power_law_1.01,0.04154239892959595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,16,1,power_law_1.01,0.04224640130996704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,16,1,power_law_1.2,0.04190079867839813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,16,1,power_law_1.2,0.04246399998664856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,2,1,balanced,0.0660693347454071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,2,1,balanced,0.0661599983771642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,2,1,power_law_1.01,0.06484479904174804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,2,1,power_law_1.01,0.06500480175018311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,2,1,power_law_1.2,0.06440320014953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,2,1,power_law_1.2,0.06531199812889099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,4,1,balanced,0.05172266562779745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,4,1,balanced,0.05208000044027964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,4,1,power_law_1.01,0.04855040013790131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,4,1,power_law_1.01,0.04906240105628967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,4,1,power_law_1.2,0.04789760112762451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,4,1,power_law_1.2,0.050892800092697144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,8,1,balanced,0.03913066784540812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,8,1,balanced,0.03965333352486292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,8,1,power_law_1.01,0.03797760009765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,8,1,power_law_1.01,0.03808000087738037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,8,1,power_law_1.2,0.037171199917793274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2048,8,256,8,1,power_law_1.2,0.03772160112857818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,1,balanced,0.10094400246938069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,1,balanced,0.10146666566530864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,1,power_law_1.01,0.09741439819335937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,1,power_law_1.01,0.0979200005531311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,1,power_law_1.2,0.09713919758796692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,1,power_law_1.2,0.09800320267677307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,16,balanced,0.058090666929880776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,16,balanced,0.058389330903689064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,16,power_law_1.01,0.1020095944404602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,16,power_law_1.01,0.1027135968208313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,16,power_law_1.2,0.10205440521240235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,16,power_law_1.2,0.1026304006576538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,2,balanced,0.08366933465003967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,2,balanced,0.08452266454696655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,2,power_law_1.01,0.1020799994468689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,2,power_law_1.01,0.10325759649276733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,2,power_law_1.2,0.10175360441207885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,2,power_law_1.2,0.10195200443267823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,32,balanced,0.05795733133951823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,32,balanced,0.058890665570894875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,32,power_law_1.01,0.0853056013584137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,32,power_law_1.01,0.08766080141067505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,32,power_law_1.2,0.08579840064048767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,32,power_law_1.2,0.0858240008354187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,4,balanced,0.06422933439413707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,4,balanced,0.06459733347098033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,4,power_law_1.01,0.10034559965133667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,4,power_law_1.01,0.10207359790802002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,4,power_law_1.2,0.09943040013313294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,4,power_law_1.2,0.10044159889221191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,8,balanced,0.05797333518664042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,8,balanced,0.05827199916044871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,8,power_law_1.01,0.1
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,8,power_law_1.01,0.1020799994468689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,8,power_law_1.2,0.10132479667663574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,1,8,power_law_1.2,0.10172799825668336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,2,1,balanced,0.07232533395290375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,2,1,balanced,0.07432533303896587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,2,1,power_law_1.01,0.07128959894180298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,2,1,power_law_1.01,0.07217280268669128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,2,1,power_law_1.2,0.07117440104484558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,2,1,power_law_1.2,0.07132800221443177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,4,1,balanced,0.053898667295773826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,4,1,balanced,0.055573334296544395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,4,1,power_law_1.01,0.05370240211486817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,4,1,power_law_1.01,0.055353599786758426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,4,1,power_law_1.2,0.05243520140647888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,6144,2560,8,160,4,1,power_law_1.2,0.0536191999912262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,1,balanced,0.09489599863688152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,1,balanced,0.09733866651852925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,1,power_law_1.01,0.0955839991569519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,1,power_law_1.01,0.09720320105552674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,1,power_law_1.2,0.09516800045967103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,1,power_law_1.2,0.09637119770050048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,128,balanced,0.05811200042565664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,128,balanced,0.060090666015942894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,128,power_law_1.01,0.07180799841880799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,128,power_law_1.01,0.07338879704475403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,128,power_law_1.2,0.075135999917984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,128,power_law_1.2,0.07564160227775574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,16,balanced,0.058149332801500954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,16,balanced,0.05961066484451294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,16,power_law_1.01,0.09880959987640381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,16,power_law_1.01,0.10031360387802124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,16,power_law_1.2,0.09850879907608032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,16,power_law_1.2,0.09920639991760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,2,balanced,0.08076266447703044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,2,balanced,0.0823413332303365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,2,power_law_1.01,0.09969279766082764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,2,power_law_1.01,0.09983360171318054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,2,power_law_1.2,0.10021120309829712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,2,power_law_1.2,0.10169600248336792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,256,balanced,0.06002666552861532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,256,balanced,0.06353066861629486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,256,power_law_1.01,0.0568448007106781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,256,power_law_1.01,0.0581055998802185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,256,power_law_1.2,0.05759360194206238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,256,power_law_1.2,0.058278399705886844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,32,balanced,0.05871999760468801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,32,balanced,0.05935466786225637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,32,power_law_1.01,0.1011072039604187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,32,power_law_1.01,0.10145920515060425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,32,power_law_1.2,0.09976320266723633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,32,power_law_1.2,0.10131839513778687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,4,balanced,0.07123733560244243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,4,balanced,0.07434133191903432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,4,power_law_1.01,0.09905920028686524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,4,power_law_1.01,0.09996799826622009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,4,power_law_1.2,0.10028799772262573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,4,power_law_1.2,0.10075520277023316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,64,balanced,0.059994667768478394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,64,balanced,0.06401066482067108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,64,power_law_1.01,0.08038399815559387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,64,power_law_1.01,0.08044160008430482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,64,power_law_1.2,0.0802944004535675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,64,power_law_1.2,0.08121600151062011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,8,balanced,0.05801066756248474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,8,balanced,0.059562668204307556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,8,power_law_1.01,0.09496960043907166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,8,power_law_1.01,0.09529600143432618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,8,power_law_1.2,0.09662079811096191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,1,8,power_law_1.2,0.0973695993423462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,16,1,balanced,0.045706664522488914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,16,1,balanced,0.04626133541266123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,16,1,power_law_1.01,0.04510720074176788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,16,1,power_law_1.01,0.04519680142402649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,16,1,power_law_1.2,0.046003198623657225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,16,1,power_law_1.2,0.0461760014295578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,2,1,balanced,0.07289066910743713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,2,1,balanced,0.07380799949169159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,2,1,power_law_1.01,0.07127040028572082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,2,1,power_law_1.01,0.07160959839820862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,2,1,power_law_1.2,0.07036799788475037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,2,1,power_law_1.2,0.07126399874687195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,4,1,balanced,0.0580320010582606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,4,1,balanced,0.058378666639328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,4,1,power_law_1.01,0.056460797786712646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,4,1,power_law_1.01,0.05668479800224304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,4,1,power_law_1.2,0.055936002731323244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,4,1,power_law_1.2,0.05730559825897217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,8,1,balanced,0.043621331453323364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,8,1,balanced,0.045754666129748024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,8,1,power_law_1.01,0.04141440093517303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,8,1,power_law_1.01,0.04209280014038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,8,1,power_law_1.2,0.041433599591255185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,256,8,1,power_law_1.2,0.04159359931945801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,1,balanced,0.09637332955996196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,1,balanced,0.09890666604042053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,1,power_law_1.01,0.09409919977188111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,1,power_law_1.01,0.09604480266571044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,1,power_law_1.2,0.09381759762763978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,1,power_law_1.2,0.09612159729003907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,128,balanced,0.060080001751581825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,128,balanced,0.060218666990598045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,128,power_law_1.01,0.07767040133476258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,128,power_law_1.01,0.07788159847259521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,128,power_law_1.2,0.07752959728240967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,128,power_law_1.2,0.07949439883232116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,16,balanced,0.05820799867312113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,16,balanced,0.059877331058184304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,16,power_law_1.01,0.0997376024723053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,16,power_law_1.01,0.10009599924087524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,16,power_law_1.2,0.099891197681427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,16,power_law_1.2,0.10004479885101318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,2,balanced,0.08072000245253245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,2,balanced,0.08241066833337148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,2,power_law_1.01,0.10255359411239624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,2,power_law_1.01,0.10291199684143067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,2,power_law_1.2,0.10111360549926758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,2,power_law_1.2,0.10151040554046631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,32,balanced,0.05839466551939646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,32,balanced,0.062309334675470986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,32,power_law_1.01,0.10085120201110839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,32,power_law_1.01,0.10113279819488526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,32,power_law_1.2,0.10062719583511352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,32,power_law_1.2,0.1019327998161316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,4,balanced,0.07601066430409749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,4,balanced,0.07670400043328603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,4,power_law_1.01,0.09928320050239563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,4,power_law_1.01,0.10235519409179687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,4,power_law_1.2,0.10046080350875855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,4,power_law_1.2,0.10098559856414795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,64,balanced,0.0599839985370636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,64,balanced,0.06402666866779327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,64,power_law_1.01,0.09106559753417968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,64,power_law_1.01,0.09163519740104675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,64,power_law_1.2,0.09050880074501037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,64,power_law_1.2,0.09088000059127807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,8,balanced,0.05818133552869161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,8,balanced,0.0609386662642161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,8,power_law_1.01,0.09921919703483581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,8,power_law_1.01,0.1007423996925354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,8,power_law_1.2,0.09978240132331848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,1,8,power_law_1.2,0.10038399696350098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,16,1,balanced,0.047744000951449074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,16,1,balanced,0.047877331574757896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,16,1,power_law_1.01,0.04557439982891083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,16,1,power_law_1.01,0.04602240025997162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,16,1,power_law_1.2,0.045747199654579164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,16,1,power_law_1.2,0.04657280147075653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,2,1,balanced,0.07136533161004384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,2,1,balanced,0.07238933444023132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,2,1,power_law_1.01,0.07098879814147949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,2,1,power_law_1.01,0.0711296021938324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,2,1,power_law_1.2,0.07078400254249573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,2,1,power_law_1.2,0.07100160121917724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,4,1,balanced,0.06469333171844482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,4,1,balanced,0.06623999774456024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,4,1,power_law_1.01,0.060601598024368285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,4,1,power_law_1.01,0.06270719766616821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,4,1,power_law_1.2,0.06185600161552429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,4,1,power_law_1.2,0.06280320286750793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,8,1,balanced,0.051829333106676735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,8,1,balanced,0.05349866549173991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,8,1,power_law_1.01,0.04798080027103424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,8,1,power_law_1.01,0.048742398619651794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,8,1,power_law_1.2,0.04759680032730103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1,7168,2048,8,384,8,1,power_law_1.2,0.04766719937324524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,1,balanced,0.28809599081675213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,1,balanced,0.29020800193150836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,1,power_law_1.01,0.3687551975250244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,1,power_law_1.01,0.3694272041320801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,1,power_law_1.2,0.3786688089370728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,1,power_law_1.2,0.37971200942993166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,128,balanced,0.11243733763694763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,128,balanced,0.11426132917404175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,128,power_law_1.01,0.11584000587463379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,128,power_law_1.01,0.11684479713439941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,128,power_law_1.2,0.12254719734191895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,128,power_law_1.2,0.12360320091247559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,16,balanced,0.12550399700800577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,16,power_law_1.01,0.1384511947631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,16,power_law_1.01,0.14055039882659912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,16,power_law_1.2,0.14364800453186036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,16,power_law_1.2,0.14661120176315307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,2,balanced,0.20815465847651163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,2,balanced,0.20891199509302774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,2,power_law_1.01,0.26010239124298096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,2,power_law_1.01,0.26267518997192385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,2,power_law_1.2,0.2605504035949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,2,power_law_1.2,0.2728384017944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,32,balanced,0.11796266833941142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,32,balanced,0.12107200423876445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,32,power_law_1.01,0.1245695948600769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,32,power_law_1.01,0.1295807957649231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,32,power_law_1.2,0.13036799430847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,32,power_law_1.2,0.13612159490585327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,4,balanced,0.16192533572514853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,4,balanced,0.16387200355529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,4,power_law_1.01,0.19365760087966918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,4,power_law_1.01,0.1940287947654724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,4,power_law_1.2,0.19998719692230224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,4,power_law_1.2,0.20081920623779298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,64,balanced,0.11550399661064148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,64,balanced,0.11928533514340718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,64,power_law_1.01,0.12104959487915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,64,power_law_1.01,0.12330880165100097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,64,power_law_1.2,0.1253376007080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,64,power_law_1.2,0.12695679664611817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,8,balanced,0.13596266508102417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,8,balanced,0.13621866703033447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,8,power_law_1.01,0.15595519542694092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,8,power_law_1.01,0.15763839483261108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,8,power_law_1.2,0.15965440273284912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,1,8,power_law_1.2,0.1652992010116577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,2,1,balanced,0.18425599733988443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,2,1,balanced,0.18502400318781534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,2,1,power_law_1.01,0.23365120887756347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,2,1,power_law_1.01,0.23431038856506348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,2,1,power_law_1.2,0.23758718967437745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,2048,768,8,128,2,1,power_law_1.2,0.2397439956665039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,1,balanced,1.1572799682617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,1,balanced,1.1586506366729736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,1,power_law_1.01,1.2710975646972655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,1,power_law_1.01,1.2745792388916015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,1,power_law_1.2,1.341260814666748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,1,power_law_1.2,1.343449592590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,128,balanced,0.20547733704249063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,128,balanced,0.20618132750193277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,128,power_law_1.01,0.21598079204559326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,128,power_law_1.01,0.21751039028167723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,128,power_law_1.2,0.22481279373168944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,128,power_law_1.2,0.2266688108444214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,16,balanced,0.2653226653734843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,16,balanced,0.26715733607610065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,16,power_law_1.01,0.285536003112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,16,power_law_1.01,0.29103360176086424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,16,power_law_1.2,0.29617919921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,16,power_law_1.2,0.29998719692230225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,2,balanced,0.6972106297810873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,2,balanced,0.698479970296224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,2,power_law_1.01,0.7730688095092774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,2,power_law_1.01,0.7823552131652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,2,power_law_1.2,0.7929344177246094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,2,power_law_1.2,0.8003583908081054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,256,balanced,0.2023573319117228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,256,balanced,0.20346667369206747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,256,power_law_1.01,0.20885119438171387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,256,power_law_1.01,0.21016321182250977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,256,power_law_1.2,0.21505279541015626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,256,power_law_1.2,0.2151103973388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,32,balanced,0.22936532894770303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,32,balanced,0.22975466648737589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,32,power_law_1.01,0.2511359930038452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,32,power_law_1.01,0.25306239128112795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,32,power_law_1.2,0.25575039386749265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,32,power_law_1.2,0.2562560081481934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,4,balanced,0.45666666825612384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,4,balanced,0.4575413465499878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,4,power_law_1.01,0.4956672191619873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,4,power_law_1.01,0.49954562187194823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,4,power_law_1.2,0.5228479862213135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,4,power_law_1.2,0.5239808082580566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,64,balanced,0.21270400285720825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,64,balanced,0.2131040096282959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,64,power_law_1.01,0.2261120080947876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,64,power_law_1.01,0.226476788520813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,64,power_law_1.2,0.2337023973464966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,64,power_law_1.2,0.2385472059249878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,8,balanced,0.33049599329630536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,8,balanced,0.331984003384908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,8,power_law_1.01,0.3612864017486572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,8,power_law_1.01,0.3666752099990845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,8,power_law_1.2,0.38373761177062987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,1,8,power_law_1.2,0.38467841148376464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,2,1,balanced,0.6559840043385824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,2,1,balanced,0.6566986640294393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,2,1,power_law_1.01,0.7133503913879394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,2,1,power_law_1.01,0.7213312149047851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,2,1,power_law_1.2,0.7581888198852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,2,1,power_law_1.2,0.7635456085205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,4,1,balanced,0.4078559875488281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,4,1,balanced,0.4081759850184123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,4,1,power_law_1.01,0.43810558319091797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,4,1,power_law_1.01,0.43854718208312987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,4,1,power_law_1.2,0.45185279846191406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,3072,1536,8,256,4,1,power_law_1.2,0.4572159767150879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,1,balanced,1.5512213706970215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,1,balanced,1.5520799954732258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,1,power_law_1.01,1.6580543518066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,1,power_law_1.01,1.6651775360107421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,1,power_law_1.2,1.646886444091797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,1,power_law_1.2,1.6673728942871093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,2,balanced,0.9084266821543375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,2,balanced,0.9092533588409424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,2,power_law_1.01,1.1225152015686035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,2,power_law_1.01,1.1979968070983886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,2,power_law_1.2,1.1051775932312011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,2,power_law_1.2,1.3278656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,4,balanced,0.5741333166758219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,4,balanced,0.5769759813944498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,4,power_law_1.01,1.0411199569702148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,4,power_law_1.01,1.0760128021240234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,4,power_law_1.2,0.9036224365234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,4,power_law_1.2,0.9956416130065918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,8,balanced,0.4657653172810872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,8,balanced,0.4670399824778239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,8,power_law_1.01,0.7850048065185546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,8,power_law_1.01,0.8119808197021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,8,power_law_1.2,0.8454463958740235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,1,8,power_law_1.2,0.8492992401123047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,16,1,balanced,0.16061333815256754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,16,1,balanced,0.1623199979464213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,16,1,power_law_1.01,0.1658687949180603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,16,1,power_law_1.01,0.1672127962112427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,16,1,power_law_1.2,0.16632959842681885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,16,1,power_law_1.2,0.16658560037612916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,2,1,balanced,0.8081333637237549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,2,1,balanced,0.8096480369567871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,2,1,power_law_1.01,0.8656319618225098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,2,1,power_law_1.01,0.8711039543151855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,2,1,power_law_1.2,0.8513088226318359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,2,1,power_law_1.2,0.8531264305114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,4,1,balanced,0.44571201006571454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,4,1,balanced,0.44787200291951496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,4,1,power_law_1.01,0.4553664207458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,4,1,power_law_1.01,0.45706877708435056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,4,1,power_law_1.2,0.46229119300842286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,4,1,power_law_1.2,0.4739583969116211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,8,1,balanced,0.2646933396657308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,8,1,balanced,0.26532800992329914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,8,1,power_law_1.01,0.27064321041107176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,8,1,power_law_1.01,0.2724096059799194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,8,1,power_law_1.2,0.27073919773101807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,14336,2,8,8,1,power_law_1.2,0.27392001152038575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,1,balanced,0.8360746701558431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,1,balanced,0.8388693332672119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,1,power_law_1.01,1.1603967666625976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,1,power_law_1.01,1.1721216201782227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,1,power_law_1.2,1.1989055633544923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,1,power_law_1.2,1.2053376197814942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,128,balanced,0.20186134179433188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,128,balanced,0.2032639980316162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,128,power_law_1.01,0.21807360649108887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,128,power_law_1.01,0.21935360431671141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,128,power_law_1.2,0.2358975887298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,128,power_law_1.2,0.23893120288848876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,16,balanced,0.23439466953277588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,16,balanced,0.237664004166921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,16,power_law_1.01,0.2977792024612427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,16,power_law_1.01,0.2982208013534546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,16,power_law_1.2,0.31127679347991943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,16,power_law_1.2,0.31290879249572756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,2,balanced,0.5368426640828451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,2,balanced,0.5383146603902181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,2,power_law_1.01,0.7059264183044434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,2,power_law_1.01,0.7362304210662842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,2,power_law_1.2,0.7329919815063477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,2,power_law_1.2,0.7469567775726318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,32,balanced,0.210207998752594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,32,balanced,0.21242666244506836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,32,power_law_1.01,0.2539968013763428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,32,power_law_1.01,0.25849599838256837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,32,power_law_1.2,0.26940159797668456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,32,power_law_1.2,0.2758016109466553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,4,balanced,0.36534400780995685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,4,balanced,0.3656533161799113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,4,power_law_1.01,0.4665408134460449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,4,power_law_1.01,0.4881472110748291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,4,power_law_1.2,0.5119743824005127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,4,power_law_1.2,0.514028787612915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,64,balanced,0.20418665806452432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,64,balanced,0.2058453361193339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,64,power_law_1.01,0.2334912061691284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,64,power_law_1.01,0.2358783960342407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,64,power_law_1.2,0.2440959930419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,64,power_law_1.2,0.24993278980255126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,8,balanced,0.27955732742945355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,8,balanced,0.27962666749954224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,8,power_law_1.01,0.3544447898864746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,8,power_law_1.01,0.3575615882873535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,8,power_law_1.2,0.3689984083175659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,1,8,power_law_1.2,0.38744320869445803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,2,1,balanced,0.4996480147043864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,2,1,balanced,0.5000373522440592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,2,1,power_law_1.01,0.6561279773712159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,2,1,power_law_1.01,0.6595007896423339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,2,1,power_law_1.2,0.6622335910797119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,2,1,power_law_1.2,0.6772799968719483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,4,1,balanced,0.31146132946014404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,4,1,balanced,0.31153066953023273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,4,1,power_law_1.01,0.40956802368164064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,4,1,power_law_1.01,0.4111743927001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,4,1,power_law_1.2,0.4111487865447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,1536,8,128,4,1,power_law_1.2,0.415283203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,1,balanced,5.084671974182129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,1,balanced,5.089290618896484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,1,power_law_1.01,6.32174072265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,1,power_law_1.01,6.348710250854492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,1,power_law_1.2,6.507148742675781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,1,power_law_1.2,6.509190368652344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,128,balanced,0.7392799854278564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,128,balanced,0.7415786584218343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,128,power_law_1.01,0.7892096042633057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,128,power_law_1.01,0.798041582107544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,128,power_law_1.2,0.820025634765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,128,power_law_1.2,0.8238143920898438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,16,balanced,0.9890666802724203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,16,balanced,0.9944852987925211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,16,power_law_1.01,1.1362751960754394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,16,power_law_1.01,1.1512831687927245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,16,power_law_1.2,1.222879981994629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,16,power_law_1.2,1.2231167793273925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,2,balanced,2.934965451558431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,2,balanced,2.9371414184570312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,2,power_law_1.01,3.5848320007324217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,2,power_law_1.01,3.598944091796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,2,power_law_1.2,3.6838016510009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,2,power_law_1.2,3.696249771118164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,256,balanced,0.7240906556447347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,256,balanced,0.7282559871673584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,256,power_law_1.01,0.7668543815612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,256,power_law_1.01,0.7677440166473388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,256,power_law_1.2,0.7876416206359863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,256,power_law_1.2,0.791590404510498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,32,balanced,0.8472159703572592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,32,balanced,0.8474453290303549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,32,power_law_1.01,0.9495488166809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,32,power_law_1.01,0.9630911827087403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,32,power_law_1.2,0.9688256263732911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,32,power_law_1.2,0.9822848320007325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,4,balanced,1.8284053802490234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,4,balanced,1.8325120608011882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,4,power_law_1.01,2.195840072631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,4,power_law_1.01,2.2418495178222657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,4,power_law_1.2,2.2254592895507814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,4,power_law_1.2,2.308639907836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,64,balanced,0.7773386637369791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,64,balanced,0.7797386646270752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,64,power_law_1.01,0.841055965423584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,64,power_law_1.01,0.848639965057373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,64,power_law_1.2,0.874233627319336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,64,power_law_1.2,0.9056063652038574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,8,balanced,1.2760852972666423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,8,balanced,1.2788906892140706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,8,power_law_1.01,1.5083328247070313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,8,power_law_1.01,1.512607955932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,8,power_law_1.2,1.5565119743347169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,4096,2688,22,512,1,8,power_law_1.2,1.5761024475097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,1,balanced,2.4795947074890137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,1,balanced,2.480639934539795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,1,power_law_1.01,2.7065792083740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,1,power_law_1.01,2.710758399963379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,1,power_law_1.2,2.6769344329833986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,1,power_law_1.2,2.6900800704956054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,2,balanced,1.3871466318766277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,2,balanced,1.3886826833089192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,2,power_law_1.01,1.8470016479492188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,2,power_law_1.01,1.8664960861206055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,2,power_law_1.2,1.8916671752929688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,2,power_law_1.2,2.2657024383544924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,4,balanced,0.8985919952392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,4,balanced,0.8995947043100992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,4,power_law_1.01,1.4519743919372559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,4,power_law_1.01,1.4774399757385255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,4,power_law_1.2,1.4548352241516114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,4,power_law_1.2,1.5718208312988282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,8,balanced,0.5970346530278524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,8,balanced,0.5972640117009481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,8,power_law_1.01,1.2881919860839843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,8,power_law_1.01,1.3143744468688965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,8,power_law_1.2,1.1993280410766602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,1,8,power_law_1.2,1.3153152465820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,16,1,balanced,0.22935465971628824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,16,1,balanced,0.23079999287923178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,16,1,power_law_1.01,0.23636479377746583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,16,1,power_law_1.01,0.23672959804534913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,16,1,power_law_1.2,0.2363840103149414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,16,1,power_law_1.2,0.24695041179656982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,2,1,balanced,1.26909335454305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,2,1,balanced,1.2706720034281414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,2,1,power_law_1.01,1.3716608047485352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,2,1,power_law_1.01,1.3753215789794921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,2,1,power_law_1.2,1.3658047676086427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,2,1,power_law_1.2,1.3660736083984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,32,1,balanced,0.1492586632569631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,32,1,balanced,0.15054399768511453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,32,1,power_law_1.01,0.151910400390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,32,1,power_law_1.01,0.15226240158081056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,32,1,power_law_1.2,0.15159039497375487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,32,1,power_law_1.2,0.1518720030784607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,4,1,balanced,0.6670826276143392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,4,1,balanced,0.668608029683431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,4,1,power_law_1.01,0.7239168167114258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,4,1,power_law_1.01,0.7275199890136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,4,1,power_law_1.2,0.7188799858093262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,4,1,power_law_1.2,0.7236735820770264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,8,1,balanced,0.39266133308410645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,8,1,balanced,0.39293332894643146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,8,1,power_law_1.01,0.39983999729156494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,8,1,power_law_1.01,0.41408638954162597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,8,1,power_law_1.2,0.4005887985229492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,16384,2,8,8,1,power_law_1.2,0.41877121925354005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,1,balanced,2.775877316792806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,1,balanced,2.777770678202311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,1,power_law_1.01,3.100627136230469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,1,power_law_1.01,3.128447914123535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,1,power_law_1.2,3.2118270874023436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,1,power_law_1.2,3.2135360717773436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,128,balanced,0.33109333117802936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,128,balanced,0.3315040071805318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,128,power_law_1.01,0.35732479095458985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,128,power_law_1.01,0.36008319854736326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,128,power_law_1.2,0.37777280807495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,128,power_law_1.2,0.38056321144104005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,16,balanced,0.4697493314743042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,16,balanced,0.47339733441670734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,16,power_law_1.01,0.5370560169219971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,16,power_law_1.01,0.5407551765441895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,16,power_law_1.2,0.5348864078521729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,16,power_law_1.2,0.5471615791320801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,2,balanced,1.5624160766601562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,2,balanced,1.566245396931966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,2,power_law_1.01,1.7493247985839844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,2,power_law_1.01,1.7682432174682616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,2,power_law_1.2,1.8350528717041015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,2,power_law_1.2,1.8749376296997071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,256,balanced,0.3237280050913493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,256,balanced,0.32443734010060626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,256,power_law_1.01,0.34248321056365966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,256,power_law_1.01,0.3440256118774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,256,power_law_1.2,0.3592832088470459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,256,power_law_1.2,0.362009596824646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,32,balanced,0.39159464836120605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,32,balanced,0.3919839859008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,32,power_law_1.01,0.4386879920959473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,32,power_law_1.01,0.44165759086608886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,32,power_law_1.2,0.46190719604492186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,32,power_law_1.2,0.4619328022003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,4,balanced,0.9481066862742106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,4,balanced,0.9482933680216471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,4,power_law_1.01,1.0589056015014648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,4,power_law_1.01,1.0590720176696777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,4,power_law_1.2,1.109337615966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,4,power_law_1.2,1.1360320091247558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,64,balanced,0.3468053340911865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,64,balanced,0.3470453421274821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,64,power_law_1.01,0.38754560947418215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,64,power_law_1.01,0.38944640159606936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,64,power_law_1.2,0.39895679950714114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,64,power_law_1.2,0.41376638412475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,8,balanced,0.6166186730066935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,8,balanced,0.6177653471628824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,8,power_law_1.01,0.706982421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,8,power_law_1.01,0.7256768226623536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,8,power_law_1.2,0.7401088237762451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,1,8,power_law_1.2,0.7567808151245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,16,1,balanced,0.42636267344156903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,16,1,balanced,0.4285866816838582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,16,1,power_law_1.01,0.4855679988861084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,16,1,power_law_1.01,0.48611202239990237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,16,1,power_law_1.2,0.503001594543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,16,1,power_law_1.2,0.5032896041870117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,2,1,balanced,1.4963253339131672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,2,1,balanced,1.4965173403422039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,2,1,power_law_1.01,1.6654272079467773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,2,1,power_law_1.01,1.6787967681884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,2,1,power_law_1.2,1.754265594482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,2,1,power_law_1.2,1.7551103591918946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,4,1,balanced,0.8494666417439779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,4,1,balanced,0.8496853510538737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,4,1,power_law_1.01,0.9534784317016601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,4,1,power_law_1.01,0.965004825592041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,4,1,power_law_1.2,0.9817407608032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,4,1,power_law_1.2,0.9900992393493653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,8,1,balanced,0.4668266773223877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,8,1,balanced,0.47145068645477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,8,1,power_law_1.01,0.541318416595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,8,1,power_law_1.01,0.5463359832763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,8,1,power_law_1.2,0.5718719959259033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2048,8,256,8,1,power_law_1.2,0.5723008155822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,1,balanced,2.251130739847819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,1,balanced,2.25163205464681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,1,power_law_1.01,2.985247993469238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,1,power_law_1.01,2.9875455856323243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,1,power_law_1.2,3.061235237121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,1,power_law_1.2,3.097011184692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,16,balanced,0.42768001556396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,16,balanced,0.42976001898447674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,16,power_law_1.01,0.5518847942352295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,16,power_law_1.01,0.5544000148773194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,16,power_law_1.2,0.5737919807434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,16,power_law_1.2,0.5811327934265137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,2,balanced,1.2985386848449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,2,balanced,1.2992266813913982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,2,power_law_1.01,1.7138431549072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,2,power_law_1.01,1.729497528076172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,2,power_law_1.2,1.778803253173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,2,power_law_1.2,1.800057601928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,32,balanced,0.36182932058970135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,32,balanced,0.3636000156402588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,32,power_law_1.01,0.4706431865692139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,32,power_law_1.01,0.4737088203430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,32,power_law_1.2,0.4691775798797607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,32,power_law_1.2,0.49939842224121095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,4,balanced,0.8004266421000162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,4,balanced,0.8027413686116537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,4,power_law_1.01,1.067404842376709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,4,power_law_1.01,1.0729536056518554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,4,power_law_1.2,1.0835200309753419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,4,power_law_1.2,1.090828800201416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,8,balanced,0.55403733253479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,8,balanced,0.5555520057678223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,8,power_law_1.01,0.7180223941802979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,8,power_law_1.01,0.7290495872497559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,8,power_law_1.2,0.7499072074890136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,1,8,power_law_1.2,0.7851776123046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,2,1,balanced,1.2184853553771973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,2,1,balanced,1.2186559836069744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,2,1,power_law_1.01,1.6145280838012694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,2,1,power_law_1.01,1.6179071426391602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,2,1,power_law_1.2,1.6652544021606446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,2,1,power_law_1.2,1.6722623825073242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,4,1,balanced,0.7273973623911539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,4,1,balanced,0.7278613249460856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,4,1,power_law_1.01,0.8988800048828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,4,1,power_law_1.01,0.9174655914306641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,4,1,power_law_1.2,0.9371904373168946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,6144,2560,8,160,4,1,power_law_1.2,0.9390399932861329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,1,balanced,3.2140000661214194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,1,balanced,3.2170079549153647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,1,power_law_1.01,3.584128189086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,1,power_law_1.01,3.639424133300781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,1,power_law_1.2,3.7761470794677736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,1,power_law_1.2,3.781363296508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,128,balanced,0.35871466000874835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,128,balanced,0.360096017519633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,128,power_law_1.01,0.39246718883514403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,128,power_law_1.01,0.3992448091506958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,128,power_law_1.2,0.40769281387329104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,128,power_law_1.2,0.4142144203186035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,16,balanced,0.5231573184331259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,16,balanced,0.5246933301289877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,16,power_law_1.01,0.5901567935943604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,16,power_law_1.01,0.5920703887939454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,16,power_law_1.2,0.6189824104309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,16,power_law_1.2,0.6323071956634522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,2,balanced,1.799605369567871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,2,balanced,1.8002026875813801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,2,power_law_1.01,1.992665672302246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,2,power_law_1.01,2.0285696029663085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,2,power_law_1.2,2.135001564025879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,2,power_law_1.2,2.144063949584961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,256,balanced,0.3492213487625122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,256,balanced,0.35048532485961914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,256,power_law_1.01,0.37472000122070315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,256,power_law_1.01,0.37509760856628416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,256,power_law_1.2,0.39236481189727784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,256,power_law_1.2,0.39295361042022703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,32,balanced,0.4281653165817261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,32,balanced,0.4287039836247762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,32,power_law_1.01,0.49146881103515627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,32,power_law_1.01,0.4960127830505371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,32,power_law_1.2,0.4945024013519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,32,power_law_1.2,0.5208511829376221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,4,balanced,1.0756853421529133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,4,balanced,1.0776906808217366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,4,power_law_1.01,1.197977638244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,4,power_law_1.01,1.204371166229248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,4,power_law_1.2,1.2572735786437987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,4,power_law_1.2,1.284601593017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,64,balanced,0.3796000083287557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,64,balanced,0.37966398398081463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,64,power_law_1.01,0.42408318519592286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,64,power_law_1.01,0.4254271984100342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,64,power_law_1.2,0.4507199764251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,64,power_law_1.2,0.45733118057250977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,8,balanced,0.6949813365936279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,8,balanced,0.6950506369272867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,8,power_law_1.01,0.8179583549499512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,8,power_law_1.01,0.822054386138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,8,power_law_1.2,0.8401151657104492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,1,8,power_law_1.2,0.8700799942016602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,16,1,balanced,0.4905279874801636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,16,1,balanced,0.492085337638855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,16,1,power_law_1.01,0.569158411026001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,16,1,power_law_1.01,0.5701888084411622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,16,1,power_law_1.2,0.578227186203003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,16,1,power_law_1.2,0.5808063983917237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,2,1,balanced,1.7382346789042156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,2,1,balanced,1.740074634552002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,2,1,power_law_1.01,1.9254720687866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,2,1,power_law_1.01,1.9478271484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,2,1,power_law_1.2,2.0402944564819334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,2,1,power_law_1.2,2.04400634765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,4,1,balanced,0.9811733563741049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,4,1,balanced,0.9817173480987549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,4,1,power_law_1.01,1.1167936325073242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,4,1,power_law_1.01,1.1204480171203612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,4,1,power_law_1.2,1.145024013519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,4,1,power_law_1.2,1.1490816116333007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,8,1,balanced,0.5342080195744833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,8,1,balanced,0.5365920066833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,8,1,power_law_1.01,0.6350527763366699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,8,1,power_law_1.01,0.636185598373413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,8,1,power_law_1.2,0.6596288204193115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,256,8,1,power_law_1.2,0.6600639820098877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,1,balanced,4.689632097880046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,1,balanced,4.693098704020183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,1,power_law_1.01,4.575699234008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,1,power_law_1.01,4.650009536743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,1,power_law_1.2,4.62053108215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,1,power_law_1.2,4.788115310668945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,128,balanced,0.42231468359629315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,128,balanced,0.4225493272145589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,128,power_law_1.01,0.4414656162261963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,128,power_law_1.01,0.4516736030578613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,128,power_law_1.2,0.45841279029846194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,128,power_law_1.2,0.46372480392456056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,16,balanced,0.6662986675898234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,16,balanced,0.6683626969655355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,16,power_law_1.01,0.6890687942504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,16,power_law_1.01,0.7098176002502441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,16,power_law_1.2,0.731379222869873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,16,power_law_1.2,0.7322559833526612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,2,balanced,2.5614773432413735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,2,balanced,2.5614879926045737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,2,power_law_1.01,2.4649152755737305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,2,power_law_1.01,2.5852287292480467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,2,power_law_1.2,2.5770687103271483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,2,power_law_1.2,2.631353569030762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,32,balanced,0.531274676322937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,32,balanced,0.5315253337224325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,32,power_law_1.01,0.5544767856597901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,32,power_law_1.01,0.5618624210357666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,32,power_law_1.2,0.5680511951446533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,32,power_law_1.2,0.5769919872283935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,4,balanced,1.4816160202026367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,4,balanced,1.4852213859558105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,4,power_law_1.01,1.4594112396240235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,4,power_law_1.01,1.5147456169128417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,4,power_law_1.2,1.5371007919311523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,4,power_law_1.2,1.5392512321472167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,64,balanced,0.45590933163960773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,64,balanced,0.4586879809697469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,64,power_law_1.01,0.4816319942474365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,64,power_law_1.01,0.49132161140441893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,64,power_law_1.2,0.499724817276001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,64,power_law_1.2,0.5052159786224365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,8,balanced,0.9435466925303141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,8,balanced,0.9447200298309326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,8,power_law_1.01,0.9446975708007812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,8,power_law_1.01,0.9477184295654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,8,power_law_1.2,0.9886655807495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,1,8,power_law_1.2,1.0317503929138183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,16,1,balanced,0.466048002243042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,16,1,balanced,0.46672534942626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,16,1,power_law_1.01,0.529529619216919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,16,1,power_law_1.01,0.5335936069488525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,16,1,power_law_1.2,0.5361472129821777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,16,1,power_law_1.2,0.5539711952209473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,2,1,balanced,2.5099679629007974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,2,1,balanced,2.512117385864258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,2,1,power_law_1.01,2.4417152404785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,2,1,power_law_1.01,2.4513151168823244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,2,1,power_law_1.2,2.5343296051025392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,2,1,power_law_1.2,2.6011775970458983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,4,1,balanced,1.457680066426595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,4,1,balanced,1.4577600161234539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,4,1,power_law_1.01,1.409830379486084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,4,1,power_law_1.01,1.4232768058776855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,4,1,power_law_1.2,1.4478591918945312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,4,1,power_law_1.2,1.4774080276489259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,8,1,balanced,0.6682453155517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,8,1,balanced,0.6699573198954264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,8,1,power_law_1.01,0.7643904209136962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,8,1,power_law_1.01,0.770911979675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,8,1,power_law_1.2,0.7892032146453858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1024,7168,2048,8,384,8,1,power_law_1.2,0.7904128074645996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,1,balanced,2.4373440742492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,1,balanced,2.438927968343099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,1,power_law_1.01,2.4207231521606447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,1,power_law_1.01,2.4215103149414063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,1,power_law_1.2,2.426399993896484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,1,power_law_1.2,2.4298240661621096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,128,balanced,0.9121332963307699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,128,balanced,0.916053295135498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,128,power_law_1.01,1.009708786010742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,128,power_law_1.01,1.0141695976257323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,128,power_law_1.2,1.093344020843506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,128,power_law_1.2,1.1010560035705566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,16,balanced,1.011562665303548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,16,balanced,1.0127253532409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,16,power_law_1.01,1.1477248191833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,16,power_law_1.01,1.205446434020996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,16,power_law_1.2,1.2392000198364257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,16,power_law_1.2,1.2764991760253905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,2,balanced,1.7653706868489583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,2,balanced,1.768448034922282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,2,power_law_1.01,1.8071935653686524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,2,power_law_1.01,1.8895488739013673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,2,power_law_1.2,1.9210496902465821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,2,power_law_1.2,1.9307392120361329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,32,balanced,0.9567626317342123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,32,balanced,0.9569013118743896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,32,power_law_1.01,1.0749759674072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,32,power_law_1.01,1.0813376426696777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,32,power_law_1.2,1.1505279541015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,32,power_law_1.2,1.1551168441772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,4,balanced,1.3353333473205566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,4,balanced,1.3359306653340657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,4,power_law_1.01,1.4516736030578614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,4,power_law_1.01,1.498419189453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,4,power_law_1.2,1.5126848220825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,4,power_law_1.2,1.5446784019470214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,64,balanced,0.9281973044077555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,64,balanced,0.9307200113932291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,64,power_law_1.01,1.023852825164795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,64,power_law_1.01,1.0668224334716796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,64,power_law_1.2,1.1375743865966796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,64,power_law_1.2,1.1641535758972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,8,balanced,1.1202133496602376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,8,balanced,1.1206666628519695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,8,power_law_1.01,1.1841919898986817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,8,power_law_1.01,1.254259204864502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,8,power_law_1.2,1.2651647567749023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,1,8,power_law_1.2,1.2988096237182618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,2,1,balanced,1.5006027221679688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,2,1,balanced,1.5010879834493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,2,1,power_law_1.01,1.5126976013183593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,2,1,power_law_1.01,1.5132287979125976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,2,1,power_law_1.2,1.5127039909362794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,2048,768,8,128,2,1,power_law_1.2,1.5150976181030273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,1,balanced,6.2986399332682295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,1,power_law_1.01,6.462361907958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,1,power_law_1.01,6.484678649902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,1,power_law_1.2,6.433708953857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,1,power_law_1.2,6.46390380859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,128,balanced,1.5197332700093586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,128,balanced,1.519968032836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,128,power_law_1.01,1.69117431640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,128,power_law_1.01,1.7304895401000977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,128,power_law_1.2,1.9116544723510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,128,power_law_1.2,1.9443647384643554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,16,balanced,1.7944374084472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,16,balanced,1.7971359888712566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,16,power_law_1.01,2.0448640823364257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,16,power_law_1.01,2.071500778198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,16,power_law_1.2,2.1731840133666993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,16,power_law_1.2,2.2466815948486327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,2,balanced,3.97867743174235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,2,balanced,3.983658790588379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,2,power_law_1.01,4.320755386352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,2,power_law_1.01,4.326323318481445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,2,power_law_1.2,4.2950080871582035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,2,power_law_1.2,4.39288330078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,256,balanced,1.4953014055887859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,256,balanced,1.4990720748901367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,256,power_law_1.01,1.639334487915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,256,power_law_1.01,1.6481151580810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,256,power_law_1.2,1.8033344268798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,256,power_law_1.2,1.825984001159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,32,balanced,1.6380906105041504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,32,balanced,1.63919464747111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,32,power_law_1.01,1.8666175842285155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,32,power_law_1.01,1.9021696090698241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,32,power_law_1.2,2.0537343978881837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,32,power_law_1.2,2.0916223526000977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,4,balanced,2.7349812189737954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,4,balanced,2.7370773951212564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,4,power_law_1.01,2.9913152694702148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,4,power_law_1.01,3.044256019592285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,4,power_law_1.2,3.264614486694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,4,power_law_1.2,3.3487167358398438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,64,balanced,1.560149351755778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,64,balanced,1.5628320376078289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,64,power_law_1.01,1.7551935195922852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,64,power_law_1.01,1.7953407287597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,64,power_law_1.2,1.8641216278076171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,64,power_law_1.2,1.9439615249633788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,8,balanced,2.108405272165934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,8,balanced,2.110703945159912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,8,power_law_1.01,2.386720085144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,8,power_law_1.01,2.4359552383422853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,8,power_law_1.2,2.6186752319335938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,1,8,power_law_1.2,2.6363199234008787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,2,1,balanced,3.583866755167643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,2,1,balanced,3.5840587615966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,2,1,power_law_1.01,3.664281463623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,2,1,power_law_1.01,3.670278549194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,2,1,power_law_1.2,3.647743988037109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,2,1,power_law_1.2,3.654694366455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,4,1,balanced,2.2116266886393228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,4,1,balanced,2.2143680254618325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,4,1,power_law_1.01,2.267852783203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,4,1,power_law_1.01,2.270457649230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,4,1,power_law_1.2,2.261894416809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,3072,1536,8,256,4,1,power_law_1.2,2.2691200256347654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,1,balanced,16.075220743815105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,1,balanced,16.13641103108724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,1,power_law_1.01,16.218841552734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,1,power_law_1.01,16.254725646972656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,1,power_law_1.2,16.199757385253907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,1,power_law_1.2,16.213055419921876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,2,balanced,9.282639821370443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,2,balanced,9.292282740275065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,2,power_law_1.01,10.987174224853515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,2,power_law_1.01,11.635065460205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,2,power_law_1.2,11.503449249267579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,2,power_law_1.2,14.283500671386719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,4,balanced,5.88926378885905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,4,balanced,5.8961976369222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,4,power_law_1.01,9.317254638671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,4,power_law_1.01,9.67681884765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,4,power_law_1.2,9.550911712646485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,4,power_law_1.2,9.659942626953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,8,balanced,4.182101249694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,8,balanced,4.182991981506348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,8,power_law_1.01,8.430777740478515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,8,power_law_1.01,8.83007354736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,8,power_law_1.2,9.030009460449218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,1,8,power_law_1.2,9.218489837646484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,16,1,balanced,1.2767893473307292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,16,1,balanced,1.281274636586507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,16,1,power_law_1.01,1.273964786529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,16,1,power_law_1.01,1.2821056365966796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,16,1,power_law_1.2,1.2747072219848632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,16,1,power_law_1.2,1.2765439987182616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,2,1,balanced,8.031781514485678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,2,1,balanced,8.035184224446615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,2,1,power_law_1.01,8.07519989013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,2,1,power_law_1.01,8.0840576171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,2,1,power_law_1.2,8.049542236328126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,2,1,power_law_1.2,8.079615783691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,4,1,balanced,4.139631907145183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,4,1,balanced,4.145824114481608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,4,1,power_law_1.01,4.101849746704102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,4,1,power_law_1.01,4.1052734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,4,1,power_law_1.2,4.1057281494140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,4,1,power_law_1.2,4.124256134033203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,8,1,balanced,2.197333335876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,8,1,balanced,2.20470396677653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,8,1,power_law_1.01,2.1786048889160154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,8,1,power_law_1.01,2.188262367248535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,8,1,power_law_1.2,2.168704032897949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,14336,2,8,8,1,power_law_1.2,2.1838848114013674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,1,balanced,7.76254399617513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,1,balanced,7.773216247558594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,1,power_law_1.01,7.657017517089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,1,power_law_1.01,7.675936126708985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,1,power_law_1.2,7.586048126220703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,1,power_law_1.2,7.606259155273437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,128,balanced,1.6897013982137044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,128,balanced,1.6933919588724773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,128,power_law_1.01,2.028121566772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,128,power_law_1.01,2.0481983184814454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,128,power_law_1.2,2.346099281311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,128,power_law_1.2,2.3492864608764648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,16,balanced,2.041600068410238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,16,balanced,2.044282595316569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,16,power_law_1.01,2.4984960556030273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,16,power_law_1.01,2.622105598449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,16,power_law_1.2,2.6935871124267576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,16,power_law_1.2,2.8139135360717775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,2,balanced,4.826880137125651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,2,balanced,4.82806396484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,2,power_law_1.01,4.907884979248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,2,power_law_1.01,5.134540939331055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,2,power_law_1.2,5.049369430541992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,2,power_law_1.2,5.29054069519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,32,balanced,1.8406133651733398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,32,balanced,1.8462880452473958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,32,power_law_1.01,2.2304000854492188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,32,power_law_1.01,2.261971282958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,32,power_law_1.2,2.463641548156738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,32,power_law_1.2,2.620979118347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,4,balanced,3.239013353983561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,4,balanced,3.2437121073404946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,4,power_law_1.01,3.7301441192626954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,4,power_law_1.01,3.748896026611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,4,power_law_1.2,3.8147903442382813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,4,power_law_1.2,4.112473678588867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,64,balanced,1.7412427266438801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,64,balanced,1.7457440694173176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,64,power_law_1.01,2.1334463119506837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,64,power_law_1.01,2.2326528549194338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,64,power_law_1.2,2.3665151596069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,64,power_law_1.2,2.386387252807617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,8,balanced,2.441354592641195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,8,balanced,2.443514664967855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,8,power_law_1.01,2.914291191101074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,8,power_law_1.01,3.063340759277344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,8,power_law_1.2,3.0144256591796874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,1,8,power_law_1.2,3.2358463287353514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,2,1,balanced,4.327162742614746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,2,1,balanced,4.33293342590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,2,1,power_law_1.01,4.278047943115235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,2,1,power_law_1.01,4.282112121582031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,2,1,power_law_1.2,4.269318389892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,2,1,power_law_1.2,4.272032165527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,4,1,balanced,2.6920105616251626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,4,1,balanced,2.6932481129964194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,4,1,power_law_1.01,2.6982143402099608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,4,1,power_law_1.01,2.699942398071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,4,1,power_law_1.2,2.6926143646240233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,1536,8,128,4,1,power_law_1.2,2.694060707092285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,1,balanced,38.45879364013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,1,balanced,38.469940185546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,1,power_law_1.01,36.867550659179685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,1,power_law_1.01,36.89818115234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,1,power_law_1.2,36.454202270507814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,1,power_law_1.2,36.467507934570314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,128,balanced,6.379306793212891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,128,balanced,6.387610753377278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,128,power_law_1.01,7.069100952148437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,128,power_law_1.01,7.082720184326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,128,power_law_1.2,7.7399169921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,128,power_law_1.2,7.838841247558594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,16,balanced,8.2008908589681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,16,balanced,8.214666366577148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,16,power_law_1.01,9.125997161865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,16,power_law_1.01,9.307462310791015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,16,power_law_1.2,10.027212524414063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,16,power_law_1.2,9.967520141601563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,2,balanced,22.626927693684895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,2,balanced,22.632069905598957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,2,power_law_1.01,22.53120574951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,2,power_law_1.01,22.561613464355467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,2,power_law_1.2,22.38988800048828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,2,power_law_1.2,22.6662841796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,256,balanced,6.24777094523112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,256,balanced,6.265984217325847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,256,power_law_1.01,6.918585968017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,256,power_law_1.01,6.959782409667969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,256,power_law_1.2,7.2555389404296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,256,power_law_1.2,7.462764739990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,32,balanced,7.159648259480794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,32,balanced,7.163007736206055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,32,power_law_1.01,8.200460815429688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,32,power_law_1.01,8.217523193359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,32,power_law_1.2,8.63175048828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,32,power_law_1.2,8.882592010498048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,4,balanced,14.39901860555013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,4,balanced,14.405919392903646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,4,power_law_1.01,14.965184020996094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,4,power_law_1.01,15.290643310546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,4,power_law_1.2,15.620851135253906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,4,power_law_1.2,15.749427795410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,64,balanced,6.6397705078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,64,balanced,6.66709836324056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,64,power_law_1.01,7.517977905273438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,64,power_law_1.01,7.748038482666016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,64,power_law_1.2,7.848127746582032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,64,power_law_1.2,8.280703735351562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,8,balanced,10.2816530863444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,8,balanced,10.30564816792806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,8,power_law_1.01,11.413107299804688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,8,power_law_1.01,11.45709457397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,8,power_law_1.2,12.031667327880859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,4096,2688,22,512,1,8,power_law_1.2,12.090777587890624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,1,balanced,26.125328063964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,1,balanced,26.130752563476562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,1,power_law_1.01,26.2237060546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,1,power_law_1.01,26.3046142578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,1,power_law_1.2,26.18184814453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,1,power_law_1.2,26.21895751953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,2,balanced,14.551675160725912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,2,balanced,14.554645538330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,2,power_law_1.01,16.62476806640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,2,power_law_1.01,18.811013793945314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,2,power_law_1.2,18.525868225097657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,2,power_law_1.2,19.682879638671874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,4,balanced,8.674938837687174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,4,balanced,8.680309295654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,4,power_law_1.01,15.221133422851562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,4,power_law_1.01,18.618623352050783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,4,power_law_1.2,14.012825012207031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,4,power_law_1.2,15.301036071777343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,8,balanced,5.76470947265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,8,balanced,5.765647888183594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,8,power_law_1.01,13.186592102050781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,8,power_law_1.01,14.40997772216797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,8,power_law_1.2,14.2151611328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,1,8,power_law_1.2,14.395680236816407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,16,1,balanced,2.0357227325439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,16,1,balanced,2.0392212867736816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,16,1,power_law_1.01,1.995564842224121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,16,1,power_law_1.01,2.003955268859863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,16,1,power_law_1.2,1.9993600845336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,16,1,power_law_1.2,1.9995712280273437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,2,1,balanced,13.017407735188803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,2,1,balanced,13.037775675455729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,2,1,power_law_1.01,13.100070190429687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,2,1,power_law_1.01,13.121849060058594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,2,1,power_law_1.2,13.068243408203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,2,1,power_law_1.2,13.100416564941407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,32,1,balanced,1.2916959921518962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,32,1,balanced,1.2926666736602783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,32,1,power_law_1.01,1.2719488143920898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,32,1,power_law_1.01,1.2772735595703124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,32,1,power_law_1.2,1.2799872398376464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,32,1,power_law_1.2,1.2827967643737792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,4,1,balanced,6.764261245727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,4,1,balanced,6.765546798706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,4,1,power_law_1.01,6.773388671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,4,1,power_law_1.01,6.777606201171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,4,1,power_law_1.2,6.738905334472657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,4,1,power_law_1.2,6.7696067810058596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,8,1,balanced,3.5928052266438804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,8,1,balanced,3.599365234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,8,1,power_law_1.01,3.5641407012939452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,8,1,power_law_1.01,3.5698753356933595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,8,1,power_law_1.2,3.5607936859130858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,16384,2,8,8,1,power_law_1.2,3.571724700927734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,1,balanced,14.817423502604166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,1,balanced,14.820485432942709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,1,power_law_1.01,15.671174621582031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,1,power_law_1.01,15.676742553710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,1,power_law_1.2,15.602963256835938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,1,power_law_1.2,15.64062042236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,128,balanced,2.429525375366211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,128,balanced,2.4365545908610025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,128,power_law_1.01,2.9404735565185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,128,power_law_1.01,2.9416704177856445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,128,power_law_1.2,3.2833023071289062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,128,power_law_1.2,3.327187347412109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,16,balanced,3.1380958557128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,16,balanced,3.150752067565918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,16,power_law_1.01,3.826860809326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,16,power_law_1.01,3.9224510192871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,16,power_law_1.2,4.188313674926758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,16,power_law_1.2,4.307814407348633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,2,balanced,8.751829147338867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,2,balanced,8.75387191772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,2,power_law_1.01,9.689401245117187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,2,power_law_1.01,9.863897705078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,2,power_law_1.2,10.12652816772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,2,power_law_1.2,9.4770751953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,256,balanced,2.3785759607950845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,256,balanced,2.3793066342671714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,256,power_law_1.01,2.7503103256225585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,256,power_law_1.01,2.7680959701538086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,256,power_law_1.2,3.1947776794433596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,256,power_law_1.2,3.2898048400878905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,32,balanced,2.7362613677978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,32,balanced,2.736271858215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,32,power_law_1.01,3.258854293823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,32,power_law_1.01,3.342310333251953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,32,power_law_1.2,3.831180953979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,32,power_law_1.2,3.864479827880859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,4,balanced,5.55897585550944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,4,balanced,5.565717061360677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,4,power_law_1.01,6.401248168945313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,4,power_law_1.01,6.743929290771485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,4,power_law_1.2,6.688825225830078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,4,power_law_1.2,7.071174621582031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,64,balanced,2.5323840777079263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,64,balanced,2.5376052856445312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,64,power_law_1.01,3.1648832321166993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,64,power_law_1.01,3.2348289489746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,64,power_law_1.2,3.252409744262695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,64,power_law_1.2,3.4973567962646483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,8,balanced,3.765322685241699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,8,balanced,3.7653331756591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,8,power_law_1.01,4.676422500610352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,8,power_law_1.01,4.727884674072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,8,power_law_1.2,5.049190521240234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,1,8,power_law_1.2,5.477215957641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,16,1,balanced,2.501413345336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,16,1,balanced,2.502432028452555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,16,1,power_law_1.01,2.5760320663452148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,16,1,power_law_1.01,2.5764095306396486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,16,1,power_law_1.2,2.572902488708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,16,1,power_law_1.2,2.5767040252685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,2,1,balanced,8.148010889689127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,2,1,balanced,8.15390396118164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,2,1,power_law_1.01,8.521376037597657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,2,1,power_law_1.01,8.530982208251952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,2,1,power_law_1.2,8.429523468017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,2,1,power_law_1.2,8.449798583984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,4,1,balanced,4.713818550109863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,4,1,balanced,4.716400146484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,4,1,power_law_1.01,4.957299041748047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,4,1,power_law_1.01,4.9628032684326175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,4,1,power_law_1.2,4.996211242675781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,4,1,power_law_1.2,5.002182388305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,8,1,balanced,6.488047917683919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,8,1,balanced,6.493029276529948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,8,1,power_law_1.01,6.615711975097656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,8,1,power_law_1.01,6.624050903320312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,8,1,power_law_1.2,6.639180755615234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2048,8,256,8,1,power_law_1.2,6.65323486328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,1,balanced,18.515722910563152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,1,balanced,18.534693400065105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,1,power_law_1.01,18.275648498535155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,1,power_law_1.01,18.36201629638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,1,power_law_1.2,18.21386260986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,1,power_law_1.2,18.231085205078124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,16,balanced,3.5950988133748374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,16,balanced,3.6035305658976235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,16,power_law_1.01,4.500102233886719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,16,power_law_1.01,4.947206497192383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,16,power_law_1.2,5.026163101196289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,16,power_law_1.2,5.4977470397949215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,2,balanced,10.723082224527994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,2,balanced,10.72601572672526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,2,power_law_1.01,11.403775787353515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,2,power_law_1.01,11.505856323242188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,2,power_law_1.2,11.722541046142577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,2,power_law_1.2,11.75937271118164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,32,balanced,3.0759201049804688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,32,balanced,3.077184041341146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,32,power_law_1.01,3.847391891479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,32,power_law_1.01,4.148774337768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,32,power_law_1.2,4.412108612060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,32,power_law_1.2,5.256313705444336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,4,balanced,6.325157165527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,4,balanced,6.32864507039388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,4,power_law_1.01,7.473458862304687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,4,power_law_1.01,7.809785461425781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,4,power_law_1.2,7.940576171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,4,power_law_1.2,8.62332763671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,8,balanced,4.438901265462239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,8,balanced,4.4422346750895185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,8,power_law_1.01,5.533497619628906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,8,power_law_1.01,5.650374221801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,8,power_law_1.2,5.494547271728516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,1,8,power_law_1.2,6.26624641418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,2,1,balanced,10.02346102396647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,2,1,balanced,10.024837493896484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,2,1,power_law_1.01,9.774700927734376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,2,1,power_law_1.01,9.779910278320312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,2,1,power_law_1.2,9.627565002441406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,2,1,power_law_1.2,9.687129974365234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,4,1,balanced,5.647290547688802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,4,1,balanced,5.64799435933431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,4,1,power_law_1.01,5.505708694458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,4,1,power_law_1.01,5.5170238494873045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,4,1,power_law_1.2,5.502912139892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,6144,2560,8,160,4,1,power_law_1.2,5.510611343383789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,1,balanced,17.071136474609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,1,balanced,17.080426534016926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,1,power_law_1.01,18.086213684082033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,1,power_law_1.01,18.13690948486328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,1,power_law_1.2,18.040127563476563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,1,power_law_1.2,18.193209838867187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,128,balanced,2.6341867446899414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,128,balanced,2.6386292775472007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,128,power_law_1.01,3.2387649536132814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,128,power_law_1.01,3.294707107543945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,128,power_law_1.2,3.7135551452636717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,128,power_law_1.2,3.7520000457763674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,16,balanced,3.4705918629964194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,16,balanced,3.471520105997721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,16,power_law_1.01,4.415507125854492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,16,power_law_1.01,4.452070236206055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,16,power_law_1.2,4.61011848449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,16,power_law_1.2,4.957766342163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,2,balanced,10.019845326741537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,2,balanced,10.037354787190756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,2,power_law_1.01,11.268422698974609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,2,power_law_1.01,11.486137390136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,2,power_law_1.2,11.03692169189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,2,power_law_1.2,12.013970947265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,256,balanced,2.5736160278320312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,256,balanced,2.578762690226237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,256,power_law_1.01,2.983667182922363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,256,power_law_1.01,3.0205312728881837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,256,power_law_1.2,3.536326217651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,256,power_law_1.2,3.601446533203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,32,balanced,2.99942938486735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,32,balanced,3.000581423441569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,32,power_law_1.01,3.717452621459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,32,power_law_1.01,3.859436798095703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,32,power_law_1.2,3.9007488250732423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,32,power_law_1.2,4.3573760986328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,4,balanced,6.28982416788737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,4,balanced,6.299039840698242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,4,power_law_1.01,7.430111694335937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,4,power_law_1.01,7.430419158935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,4,power_law_1.2,7.7837059020996096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,4,power_law_1.2,7.843513488769531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,64,balanced,2.7540105183919272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,64,balanced,2.7633066177368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,64,power_law_1.01,3.3432064056396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,64,power_law_1.01,3.485228729248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,64,power_law_1.2,3.9634559631347654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,64,power_law_1.2,3.9694400787353517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,8,balanced,4.242159843444824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,8,balanced,4.244821230570476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,8,power_law_1.01,5.1159423828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,8,power_law_1.01,5.312825775146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,8,power_law_1.2,5.896332931518555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,1,8,power_law_1.2,5.934963226318359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,16,1,balanced,2.8857173919677734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,16,1,balanced,2.887306531270345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,16,1,power_law_1.01,2.968671989440918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,16,1,power_law_1.01,2.9746368408203123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,16,1,power_law_1.2,2.974073600769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,16,1,power_law_1.2,2.9743679046630858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,2,1,balanced,9.429221471150717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,2,1,balanced,9.448853174845377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,2,1,power_law_1.01,9.872870635986327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,2,1,power_law_1.01,9.886771392822265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,2,1,power_law_1.2,9.803340911865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,2,1,power_law_1.2,9.84466552734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,4,1,balanced,5.418928146362305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,4,1,balanced,5.419823964436849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,4,1,power_law_1.01,5.704025650024414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,4,1,power_law_1.01,5.717491149902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,4,1,power_law_1.2,5.748211288452149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,4,1,power_law_1.2,5.7558849334716795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,8,1,balanced,7.53659184773763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,8,1,balanced,7.550687789916992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,8,1,power_law_1.01,7.7033027648925785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,8,1,power_law_1.01,7.711174774169922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,8,1,power_law_1.2,7.716851043701172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,256,8,1,power_law_1.2,7.734662628173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,1,balanced,17.41981379191081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,1,balanced,17.43221918741862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,1,power_law_1.01,19.215481567382813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,1,power_law_1.01,19.238156127929688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,1,power_law_1.2,19.377880859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,1,power_law_1.2,19.38588104248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,128,balanced,2.694239934285482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,128,balanced,2.6991732915242515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,128,power_law_1.01,3.1753984451293946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,128,power_law_1.01,3.1808448791503907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,128,power_law_1.2,3.4673023223876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,128,power_law_1.2,3.596108627319336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,16,balanced,3.53494930267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,16,balanced,3.542266527811686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,16,power_law_1.01,4.282041549682617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,16,power_law_1.01,4.299859237670899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,16,power_law_1.2,4.6061248779296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,16,power_law_1.2,4.7710014343261715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,2,balanced,10.212607701619467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,2,balanced,10.218618392944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,2,power_law_1.01,11.518547058105469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,2,power_law_1.01,11.789292907714843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,2,power_law_1.2,11.509939575195313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,2,power_law_1.2,12.150579071044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,32,balanced,3.062922795613607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,32,balanced,3.067098617553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,32,power_law_1.01,3.6184318542480467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,32,power_law_1.01,3.7720577239990236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,32,power_law_1.2,3.98682861328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,32,power_law_1.2,4.0025279998779295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,4,balanced,6.410928090413411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,4,balanced,6.425461451212565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,4,power_law_1.01,7.555046081542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,4,power_law_1.01,7.741747283935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,4,power_law_1.2,7.779788970947266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,4,power_law_1.2,7.908710479736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,64,balanced,2.811567942301432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,64,balanced,2.815802574157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,64,power_law_1.01,3.3170238494873048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,64,power_law_1.01,3.3355968475341795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,64,power_law_1.2,3.578937530517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,64,power_law_1.2,3.809203338623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,8,balanced,4.5024159749348955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,8,balanced,4.502762794494629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,8,power_law_1.01,5.650764846801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,8,power_law_1.01,5.811616134643555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,8,power_law_1.2,5.656383895874024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,1,8,power_law_1.2,5.8816062927246096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,16,1,balanced,3.4878241221110025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,16,1,balanced,3.490528106689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,16,1,power_law_1.01,3.631961441040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,16,1,power_law_1.01,3.6347904205322266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,16,1,power_law_1.2,3.670444869995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,16,1,power_law_1.2,3.6829246520996093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,2,1,balanced,9.629583994547525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,2,1,balanced,9.639621098836264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,2,1,power_law_1.01,10.482169342041015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,2,1,power_law_1.01,10.516063690185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,2,1,power_law_1.2,10.502098846435548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,2,1,power_law_1.2,10.505702209472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,4,1,balanced,5.8083038330078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,4,1,balanced,5.810997645060222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,4,1,power_law_1.01,6.141388702392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,4,1,power_law_1.01,6.160268783569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,4,1,power_law_1.2,6.136908721923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,4,1,power_law_1.2,6.171622467041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,8,1,balanced,3.8000427881876626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,8,1,balanced,3.8030878702799478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,8,1,power_law_1.01,4.046847915649414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,8,1,power_law_1.01,4.050457763671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,8,1,power_law_1.2,4.071724700927734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,12288,7168,2048,8,384,8,1,power_law_1.2,4.0855873107910154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,1,balanced,0.14443199833234152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,1,balanced,0.144896000623703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,1,power_law_1.01,0.14043519496917725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,1,power_law_1.01,0.14111360311508178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,1,power_law_1.2,0.1434175968170166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,1,power_law_1.2,0.14696320295333862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,128,balanced,0.052815998593966164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,128,balanced,0.05346666773160299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,128,power_law_1.01,0.05127040147781372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,128,power_law_1.01,0.05137919783592224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,128,power_law_1.2,0.05119360089302063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,128,power_law_1.2,0.051532799005508424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,16,balanced,0.056986664732297264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,16,balanced,0.059621334075927734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,16,power_law_1.01,0.05676800012588501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,16,power_law_1.01,0.05777919888496399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,16,power_law_1.2,0.05742719769477844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,16,power_law_1.2,0.0584447979927063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,2,balanced,0.1402186652024587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,2,balanced,0.1402773360411326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,2,power_law_1.01,0.13642239570617676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,2,power_law_1.01,0.13652479648590088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,2,power_law_1.2,0.1377344012260437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,2,power_law_1.2,0.1378559947013855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,32,balanced,0.05602666735649109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,32,balanced,0.056234667698542275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,32,power_law_1.01,0.05435519814491272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,32,power_law_1.01,0.055225598812103274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,32,power_law_1.2,0.05359359979629517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,32,power_law_1.2,0.05490559935569763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,4,balanced,0.10070400436719258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,4,balanced,0.1019040048122406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,4,power_law_1.01,0.09663360118865967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,4,power_law_1.01,0.09807360172271729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,4,power_law_1.2,0.09864959716796876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,4,power_law_1.2,0.09906560182571411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,64,balanced,0.05267733335494995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,64,balanced,0.05519466598828634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,64,power_law_1.01,0.05167359709739685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,64,power_law_1.01,0.05316479802131653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,64,power_law_1.2,0.05280640125274658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,64,power_law_1.2,0.053011202812194826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,8,balanced,0.06831466654936473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,8,balanced,0.06970133384068807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,8,power_law_1.01,0.06661120057106018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,8,power_law_1.01,0.06661760210990905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,8,power_law_1.2,0.0654911994934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,1,8,power_law_1.2,0.06663680076599121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,2,1,balanced,0.10198932886123657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,2,1,balanced,0.10320533315340678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,2,1,power_law_1.01,0.10223360061645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,2,1,power_law_1.01,0.10235519409179687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,2,1,power_law_1.2,0.10354559421539307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,2048,768,8,128,2,1,power_law_1.2,0.10936959981918334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,1,balanced,1.0293333530426025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,1,balanced,1.030501365661621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,1,power_law_1.01,0.8608832359313965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,1,power_law_1.01,0.8697600364685059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,1,power_law_1.2,0.8576448440551758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,1,power_law_1.2,0.865932846069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,128,balanced,0.0995093286037445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,128,balanced,0.10047466556231181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,128,power_law_1.01,0.0986624002456665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,128,power_law_1.01,0.0992255985736847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,128,power_law_1.2,0.09923840165138245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,128,power_law_1.2,0.09926400184631348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,16,balanced,0.156549334526062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,16,balanced,0.15727466344833374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,16,power_law_1.01,0.15077760219573974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,16,power_law_1.01,0.1533568024635315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,16,power_law_1.2,0.14855040311813356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,16,power_law_1.2,0.15020159482955933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,2,balanced,0.5643786589304606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,2,balanced,0.5654933452606201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,2,power_law_1.01,0.4767168045043945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,2,power_law_1.01,0.49413118362426756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,2,power_law_1.2,0.47000322341918943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,2,power_law_1.2,0.48401918411254885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,256,balanced,0.09716266393661499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,256,balanced,0.09845866759618123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,256,power_law_1.01,0.09627519845962525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,256,power_law_1.01,0.09667199850082397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,256,power_law_1.2,0.0967296004295349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,256,power_law_1.2,0.09696000218391418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,32,balanced,0.12588799993197122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,32,balanced,0.1269706686337789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,32,power_law_1.01,0.12062720060348511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,32,power_law_1.01,0.12275199890136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,32,power_law_1.2,0.11927039623260498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,32,power_law_1.2,0.12275199890136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,4,balanced,0.3367520173390706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,4,balanced,0.3368693192799886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,4,power_law_1.01,0.2866624116897583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,4,power_law_1.01,0.2877631902694702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,4,power_law_1.2,0.299782395362854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,4,power_law_1.2,0.3023551940917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,64,balanced,0.1072160005569458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,64,balanced,0.10773866375287373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,64,power_law_1.01,0.10403200387954711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,64,power_law_1.01,0.1047104001045227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,64,power_law_1.2,0.10323200225830079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,64,power_law_1.2,0.10436480045318604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,8,balanced,0.21778666973114014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,8,balanced,0.21804799636205038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,8,power_law_1.01,0.19969919919967652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,8,power_law_1.01,0.20072319507598876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,8,power_law_1.2,0.20152320861816406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,1,8,power_law_1.2,0.20658559799194337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,2,1,balanced,0.5751466751098633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,2,1,balanced,0.5764853159586588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,2,1,power_law_1.01,0.4779839992523193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,2,1,power_law_1.01,0.48226561546325686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,2,1,power_law_1.2,0.47842559814453123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,2,1,power_law_1.2,0.4854400157928467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,4,1,balanced,0.3485066493352254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,4,1,balanced,0.34856534004211426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,4,1,power_law_1.01,0.29738240242004393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,4,1,power_law_1.01,0.29808640480041504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,4,1,power_law_1.2,0.2975231885910034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,3072,1536,8,256,4,1,power_law_1.2,0.2996543884277344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,1,balanced,0.45668800671895343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,1,balanced,0.4590080181757609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,1,power_law_1.01,0.5175936222076416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,1,power_law_1.01,0.543839979171753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,1,power_law_1.2,0.48932480812072754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,1,power_law_1.2,0.4905344009399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,2,balanced,0.3302560051282247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,2,balanced,0.3316533366839091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,2,power_law_1.01,0.3486464023590088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,2,power_law_1.01,0.3518208026885986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,2,power_law_1.2,0.3378304004669189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,2,power_law_1.2,0.3463551998138428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,4,balanced,0.25781333446502686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,4,balanced,0.25909332434336346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,4,power_law_1.01,0.2811647891998291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,4,power_law_1.01,0.2888128042221069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,4,power_law_1.2,0.2883008003234863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,4,power_law_1.2,0.2890752077102661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,8,balanced,0.22637333472569784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,8,balanced,0.22712000211079916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,8,power_law_1.01,0.2492288112640381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,8,power_law_1.01,0.24976639747619628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,8,power_law_1.2,0.24885120391845703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,1,8,power_law_1.2,0.24992001056671143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,16,1,balanced,0.07426133255163829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,16,1,balanced,0.07709333300590515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,16,1,power_law_1.01,0.07795199751853943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,16,1,power_law_1.01,0.07797120213508606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,16,1,power_law_1.2,0.07768959999084472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,16,1,power_law_1.2,0.07908480167388916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,2,1,balanced,0.2614453236262004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,2,1,balanced,0.2627679904301961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,2,1,power_law_1.01,0.28309121131896975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,2,1,power_law_1.01,0.2952320098876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,2,1,power_law_1.2,0.26115200519561765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,2,1,power_law_1.2,0.2840512037277222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,4,1,balanced,0.1481760044892629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,4,1,balanced,0.15236266454060873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,4,1,power_law_1.01,0.15804799795150756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,4,1,power_law_1.01,0.15827200412750245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,4,1,power_law_1.2,0.1543552041053772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,4,1,power_law_1.2,0.15892479419708253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,8,1,balanced,0.09027199943860371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,8,1,balanced,0.09289066990216573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,8,1,power_law_1.01,0.09370239973068237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,8,1,power_law_1.01,0.09566079974174499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,8,1,power_law_1.2,0.09631999731063842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,14336,2,8,8,1,power_law_1.2,0.0991807997226715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,1,balanced,0.7057759761810303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,1,balanced,0.7073493003845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,1,power_law_1.01,0.6613376140594482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,1,power_law_1.01,0.6637951850891113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,1,power_law_1.2,0.6612415790557862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,1,power_law_1.2,0.6700607776641846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,128,balanced,0.08071466783682506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,128,balanced,0.08277866741021474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,128,power_law_1.01,0.07899519801139832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,128,power_law_1.01,0.07994880080223084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,128,power_law_1.2,0.07906559705734253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,128,power_law_1.2,0.08145279884338379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,16,balanced,0.1163146694501241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,16,balanced,0.11652266979217529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,16,power_law_1.01,0.1129472017288208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,16,power_law_1.01,0.11386239528656006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,16,power_law_1.2,0.11450239419937133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,16,power_law_1.2,0.1146239995956421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,2,balanced,0.40520532925923664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,2,balanced,0.4053279956181844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,2,power_law_1.01,0.37223680019378663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,2,power_law_1.01,0.3752448081970215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,2,power_law_1.2,0.37881600856781006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,2,power_law_1.2,0.37994239330291746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,32,balanced,0.10254933436711629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,32,balanced,0.10461866855621338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,32,power_law_1.01,0.10074880123138427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,32,power_law_1.01,0.10085120201110839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,32,power_law_1.2,0.10231679677963257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,32,power_law_1.2,0.10282880067825317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,4,balanced,0.23636800050735474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,4,balanced,0.23676800727844238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,4,power_law_1.01,0.22986240386962892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,4,power_law_1.01,0.23114240169525146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,4,power_law_1.2,0.23138558864593506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,4,power_law_1.2,0.23352959156036376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,64,balanced,0.08614400029182434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,64,balanced,0.08889066179593404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,64,power_law_1.01,0.08925439715385437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,64,power_law_1.01,0.09070720076560974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,64,power_law_1.2,0.08790400028228759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,64,power_law_1.2,0.08940160274505615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,8,balanced,0.16458666324615479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,8,balanced,0.16500799854596457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,8,power_law_1.01,0.16174720525741576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,8,power_law_1.01,0.163046395778656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,8,power_law_1.2,0.15383039712905883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,1,8,power_law_1.2,0.16227200031280517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,2,1,balanced,0.2437280019124349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,2,1,balanced,0.24474134047826132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,2,1,power_law_1.01,0.24495360851287842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,2,1,power_law_1.01,0.2475584030151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,2,1,power_law_1.2,0.24971520900726318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,2,1,power_law_1.2,0.25358080863952637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,4,1,balanced,0.1632426679134369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,4,1,balanced,0.16369066635767618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,4,1,power_law_1.01,0.16407040357589722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,4,1,power_law_1.01,0.17132799625396727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,4,1,power_law_1.2,0.1751039981842041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,1536,8,128,4,1,power_law_1.2,0.17776000499725342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,1,balanced,4.450079917907715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,1,balanced,4.450474739074707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,1,power_law_1.01,3.890214538574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,1,power_law_1.01,3.9336574554443358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,1,power_law_1.2,3.988505554199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,1,power_law_1.2,3.990630340576172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,128,balanced,0.29980266094207764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,128,balanced,0.3003999988238017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,128,power_law_1.01,0.29567999839782716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,128,power_law_1.01,0.2993664026260376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,128,power_law_1.2,0.29701120853424073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,128,power_law_1.2,0.2981120109558105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,16,balanced,0.541370670000712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,16,balanced,0.5434933503468832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,16,power_law_1.01,0.5156544208526611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,16,power_law_1.01,0.5191359996795655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,16,power_law_1.2,0.5204288005828858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,16,power_law_1.2,0.5248383998870849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,2,balanced,2.369119962056478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,2,balanced,2.3712053298950195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,2,power_law_1.01,2.075379180908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,2,power_law_1.01,2.154278373718262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,2,power_law_1.2,2.1293567657470702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,2,power_law_1.2,2.1736064910888673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,256,balanced,0.2828373312950134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,256,balanced,0.2852320075035095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,256,power_law_1.01,0.2813888072967529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,256,power_law_1.01,0.28222720623016356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,256,power_law_1.2,0.2829375982284546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,256,power_law_1.2,0.2829567909240723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,32,balanced,0.40617601076761883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,32,balanced,0.4062346617380778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,32,power_law_1.01,0.39159679412841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,32,power_law_1.01,0.3932543992996216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,32,power_law_1.2,0.39574398994445803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,32,power_law_1.2,0.39660799503326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,4,balanced,1.3296639919281006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,4,balanced,1.3319413661956787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,4,power_law_1.01,1.1865856170654296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,4,power_law_1.01,1.2447360038757325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,4,power_law_1.2,1.1893823623657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,4,power_law_1.2,1.229139232635498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,64,balanced,0.3391093413035075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,64,balanced,0.3407573302586873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,64,power_law_1.01,0.32956159114837646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,64,power_law_1.01,0.3360896110534668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,64,power_law_1.2,0.3326591968536377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,64,power_law_1.2,0.33466880321502684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,8,balanced,0.8090453147888184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,8,balanced,0.8112106323242188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,8,power_law_1.01,0.7426688194274902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,8,power_law_1.01,0.7611775875091553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,8,power_law_1.2,0.7309055805206299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,4096,2688,22,512,1,8,power_law_1.2,0.7494592189788818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,1,balanced,0.768666664759318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,1,balanced,0.7698240280151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,1,power_law_1.01,0.8212287902832032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,1,power_law_1.01,0.8395456314086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,1,power_law_1.2,0.8297792434692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,1,power_law_1.2,0.8399552345275879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,2,balanced,0.4438186486562093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,2,balanced,0.4442933400472005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,2,power_law_1.01,0.48998398780822755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,2,power_law_1.01,0.49103360176086425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,2,power_law_1.2,0.49054718017578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,2,power_law_1.2,0.5094592094421386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,4,balanced,0.3286293347676595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,4,balanced,0.32898133993148804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,4,power_law_1.01,0.3650304079055786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,4,power_law_1.01,0.37260799407958983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,4,power_law_1.2,0.37249279022216797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,4,power_law_1.2,0.3816256046295166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,8,balanced,0.2755840023358663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,8,balanced,0.2763306697209676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,8,power_law_1.01,0.3144448041915894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,8,power_law_1.01,0.31484160423278806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,8,power_law_1.2,0.30536959171295164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,1,8,power_law_1.2,0.31629440784454343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,16,1,balanced,0.11020267009735107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,16,1,balanced,0.11170132954915364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,16,1,power_law_1.01,0.10888960361480712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,16,1,power_law_1.01,0.10926079750061035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,16,1,power_law_1.2,0.10894720554351807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,16,1,power_law_1.2,0.10966399908065796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,2,1,balanced,0.4259573221206665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,2,1,balanced,0.4268426497777303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,2,1,power_law_1.01,0.4416192054748535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,2,1,power_law_1.01,0.45016961097717284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,2,1,power_law_1.2,0.42525439262390136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,2,1,power_law_1.2,0.43374080657958985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,32,1,balanced,0.0911253293355306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,32,1,balanced,0.09237333138783772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,32,1,power_law_1.01,0.09044479727745056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,32,1,power_law_1.01,0.09153280258178711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,32,1,power_law_1.2,0.09072639942169189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,32,1,power_law_1.2,0.09201279878616334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,4,1,balanced,0.23293334245681763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,4,1,balanced,0.25732799371083576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,4,1,power_law_1.01,0.24769279956817628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,4,1,power_law_1.01,0.24810879230499266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,4,1,power_law_1.2,0.24788479804992675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,4,1,power_law_1.2,0.26659839153289794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,8,1,balanced,0.1328426698843638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,8,1,balanced,0.13532800475756326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,8,1,power_law_1.01,0.16197119951248168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,8,1,power_law_1.01,0.16199040412902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,8,1,power_law_1.2,0.1334272027015686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,16384,2,8,8,1,power_law_1.2,0.1432255983352661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,1,balanced,2.547274589538574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,1,balanced,2.547968069712321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,1,power_law_1.01,2.0954111099243162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,1,power_law_1.01,2.1587839126586914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,1,power_law_1.2,2.0990976333618163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,1,power_law_1.2,2.112985610961914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,128,balanced,0.1686720053354899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,128,balanced,0.16993065675099692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,128,power_law_1.01,0.16584960222244263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,128,power_law_1.01,0.1670207977294922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,128,power_law_1.2,0.16570240259170532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,128,power_law_1.2,0.1664639949798584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,16,balanced,0.29542932907740277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,16,balanced,0.2981920043627421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,16,power_law_1.01,0.27832319736480715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,16,power_law_1.01,0.27939839363098146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,16,power_law_1.2,0.2663104057312012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,16,power_law_1.2,0.2802432060241699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,2,balanced,1.341418743133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,2,balanced,1.3420799573262532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,2,power_law_1.01,1.1336704254150392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,2,power_law_1.01,1.171820831298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,2,power_law_1.2,1.140492820739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,2,power_law_1.2,1.1471232414245605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,256,balanced,0.16196800271670023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,256,balanced,0.16249066591262817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,256,power_law_1.01,0.15229439735412598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,256,power_law_1.01,0.16120959520339967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,256,power_law_1.2,0.15313279628753662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,256,power_law_1.2,0.15459840297698973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,32,balanced,0.22245333592096964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,32,power_law_1.01,0.21458559036254882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,32,power_law_1.01,0.21553280353546142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,32,power_law_1.2,0.2163327932357788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,32,power_law_1.2,0.21834878921508788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,4,balanced,0.7521013418833414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,4,balanced,0.7529119650522867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,4,power_law_1.01,0.6596415996551513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,4,power_law_1.01,0.6616767883300781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,4,power_law_1.2,0.6186560153961181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,4,power_law_1.2,0.6444543838500977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,64,balanced,0.181002676486969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,64,balanced,0.18127999703089395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,64,power_law_1.01,0.175654399394989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,64,power_law_1.01,0.1798784017562866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,64,power_law_1.2,0.17431039810180665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,64,power_law_1.2,0.18002560138702392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,8,balanced,0.4429653485616048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,8,balanced,0.4431999921798706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,8,power_law_1.01,0.38863999843597413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,8,power_law_1.01,0.4177663803100586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,8,power_law_1.2,0.3899904012680054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,1,8,power_law_1.2,0.40140161514282224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,16,1,balanced,0.34329064687093097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,16,1,balanced,0.34426132837931317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,16,1,power_law_1.01,0.3139008045196533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,16,1,power_law_1.01,0.3188352108001709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,16,1,power_law_1.2,0.3136447906494141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,16,1,power_law_1.2,0.3145792007446289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,2,1,balanced,1.3545494079589844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,2,1,balanced,1.355397383371989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,2,1,power_law_1.01,1.1563263893127442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,2,1,power_law_1.01,1.1576128005981445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,2,1,power_law_1.2,1.145094394683838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,2,1,power_law_1.2,1.1518976211547851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,4,1,balanced,0.4638986587524414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,4,1,balanced,0.46477333704630536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,4,1,power_law_1.01,0.38075520992279055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,4,1,power_law_1.01,0.39702401161193845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,4,1,power_law_1.2,0.392249608039856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,4,1,power_law_1.2,0.40639362335205076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,8,1,balanced,0.29016000032424927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,8,1,balanced,0.29025065898895264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,8,1,power_law_1.01,0.25046401023864745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,8,1,power_law_1.01,0.2563904047012329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,8,1,power_law_1.2,0.25007359981536864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2048,8,256,8,1,power_law_1.2,0.25363199710845946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,1,balanced,2.014959971110026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,1,balanced,2.015450636545817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,1,power_law_1.01,1.7972671508789062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,1,power_law_1.01,1.8453184127807618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,1,power_law_1.2,1.86944637298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,1,power_law_1.2,1.8833087921142577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,16,balanced,0.24452267090479532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,16,balanced,0.245578666528066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,16,power_law_1.01,0.23740799427032472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,16,power_law_1.01,0.2420799970626831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,16,power_law_1.2,0.23784959316253662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,16,power_law_1.2,0.24236159324645995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,2,balanced,1.060314655303955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,2,balanced,1.0605599880218506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,2,power_law_1.01,0.9759360313415527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,2,power_law_1.01,1.0096320152282714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,2,power_law_1.2,1.0033472061157227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,2,power_law_1.2,1.0256896018981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,32,balanced,0.17523199319839478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,32,balanced,0.1755573352177938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,32,power_law_1.01,0.16993919610977173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,32,power_law_1.01,0.1740671992301941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,32,power_law_1.2,0.16992000341415406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,32,power_law_1.2,0.17069439888000487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,4,balanced,0.4244053363800049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,4,balanced,0.42668267091115314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,4,power_law_1.01,0.40047359466552734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,4,power_law_1.01,0.4166719913482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,4,power_law_1.2,0.42695040702819825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,4,power_law_1.2,0.4349247932434082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,8,balanced,0.35683735211690265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,8,balanced,0.3571253220240275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,8,power_law_1.01,0.33720319271087645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,8,power_law_1.01,0.3463295936584473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,8,power_law_1.2,0.34517760276794435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,1,8,power_law_1.2,0.3507711887359619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,2,1,balanced,1.068991978963216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,2,1,balanced,1.069109360376994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,2,1,power_law_1.01,0.9773951530456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,2,1,power_law_1.01,0.9818047523498535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,2,1,power_law_1.2,1.0176511764526368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,2,1,power_law_1.2,1.0305407524108887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,4,1,balanced,0.3636266787846883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,4,1,balanced,0.3638720115025838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,4,1,power_law_1.01,0.3458240032196045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,4,1,power_law_1.01,0.3470592021942139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,4,1,power_law_1.2,0.3563391923904419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,6144,2560,8,160,4,1,power_law_1.2,0.35802879333496096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,1,balanced,2.966815948486328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,1,balanced,2.96944522857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,1,power_law_1.01,2.4127872467041014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,1,power_law_1.01,2.4489919662475588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,1,power_law_1.2,2.4682111740112305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,1,power_law_1.2,2.4795711517333983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,128,balanced,0.18984532356262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,128,balanced,0.19083199898401895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,128,power_law_1.01,0.18903039693832396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,128,power_law_1.01,0.1897536039352417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,128,power_law_1.2,0.18845440149307252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,128,power_law_1.2,0.19016319513320923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,16,balanced,0.334666649500529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,16,balanced,0.3350133498509725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,16,power_law_1.01,0.3063488006591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,16,power_law_1.01,0.31727359294891355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,16,power_law_1.2,0.3115520000457764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,16,power_law_1.2,0.32072958946228025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,2,balanced,1.5565493901570637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,2,balanced,1.557978630065918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,2,power_law_1.01,1.2832063674926757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,2,power_law_1.01,1.336723232269287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,2,power_law_1.2,1.3171263694763184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,2,power_law_1.2,1.3350208282470704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,256,balanced,0.18297600746154785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,256,balanced,0.18342934052149454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,256,power_law_1.01,0.17991039752960206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,256,power_law_1.01,0.1810495972633362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,256,power_law_1.2,0.18014719486236572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,256,power_law_1.2,0.18110719919204712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,32,balanced,0.24615466594696045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,32,balanced,0.24766933917999268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,32,power_law_1.01,0.23288960456848146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,32,power_law_1.01,0.2424384117126465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,32,power_law_1.2,0.23293440341949462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,32,power_law_1.2,0.2371840000152588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,4,balanced,0.8642186323801676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,4,balanced,0.8653919696807861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,4,power_law_1.01,0.7572480201721191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,4,power_law_1.01,0.8148415565490723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,4,power_law_1.2,0.7399744033813477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,4,power_law_1.2,0.7449088096618652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,64,balanced,0.20257065693537393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,64,balanced,0.20305599768956503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,64,power_law_1.01,0.19944319725036622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,64,power_law_1.01,0.19975039958953858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,64,power_law_1.2,0.20034561157226563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,64,power_law_1.2,0.20166399478912353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,8,balanced,0.5091840028762817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,8,balanced,0.5106720129648844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,8,power_law_1.01,0.4282048225402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,8,power_law_1.01,0.4589248180389404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,8,power_law_1.2,0.4578239917755127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,1,8,power_law_1.2,0.4642752170562744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,16,1,balanced,0.39502398173014325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,16,1,balanced,0.3976000150044759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,16,1,power_law_1.01,0.360863995552063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,16,1,power_law_1.01,0.36459519863128664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,16,1,power_law_1.2,0.36090240478515623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,16,1,power_law_1.2,0.3628864049911499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,2,1,balanced,1.576709270477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,2,1,balanced,1.5767520268758137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,2,1,power_law_1.01,1.3134464263916015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,2,1,power_law_1.01,1.3263936042785645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,2,1,power_law_1.2,1.2985343933105469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,2,1,power_law_1.2,1.3305791854858398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,4,1,balanced,0.5454080104827881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,4,1,balanced,0.5477493206659952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,4,1,power_law_1.01,0.4504960060119629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,4,1,power_law_1.01,0.4579008102416992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,4,1,power_law_1.2,0.46973438262939454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,4,1,power_law_1.2,0.4729343891143799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,8,1,balanced,0.3345706860224406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,8,1,balanced,0.335258682568868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,8,1,power_law_1.01,0.2918528079986572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,8,1,power_law_1.01,0.29331839084625244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,8,1,power_law_1.2,0.2890559911727905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,256,8,1,power_law_1.2,0.2921152114868164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,1,balanced,4.39466667175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,1,balanced,4.396032015482585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,1,power_law_1.01,3.3347904205322267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,1,power_law_1.01,3.353113555908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,1,power_law_1.2,3.232998275756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,1,power_law_1.2,3.2414272308349608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,128,balanced,0.24314133326212564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,128,balanced,0.24336532751719156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,128,power_law_1.01,0.24148480892181395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,128,power_law_1.01,0.2427903890609741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,128,power_law_1.2,0.23838720321655274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,128,power_law_1.2,0.24087679386138916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,16,balanced,0.47762131690979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,16,balanced,0.47792001565297443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,16,power_law_1.01,0.43006720542907717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,16,power_law_1.01,0.44211840629577637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,16,power_law_1.2,0.4260416030883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,16,power_law_1.2,0.4267263889312744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,2,balanced,2.296544075012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,2,balanced,2.3013386726379395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,2,power_law_1.01,1.7949184417724608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,2,power_law_1.01,1.8351360321044923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,2,power_law_1.2,1.7894399642944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,2,power_law_1.2,1.8101696014404296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,32,balanced,0.34694933891296387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,32,balanced,0.34779198964436847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,32,power_law_1.01,0.33432960510253906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,32,power_law_1.01,0.33534719944000246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,32,power_law_1.2,0.32692480087280273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,32,power_law_1.2,0.32872960567474363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,4,balanced,1.2611520290374756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,4,balanced,1.2629493077596028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,4,power_law_1.01,1.058687973022461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,4,power_law_1.01,1.1190848350524902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,4,power_law_1.2,1.009017562866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,4,power_law_1.2,1.0176192283630372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,64,balanced,0.2752373417218526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,64,balanced,0.27621867259343463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,64,power_law_1.01,0.26338560581207277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,64,power_law_1.01,0.26847999095916747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,64,power_law_1.2,0.26864640712738036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,64,power_law_1.2,0.2695168018341064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,8,balanced,0.7421973546346029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,8,balanced,0.7432746887207031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,8,power_law_1.01,0.6138879776000976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,8,power_law_1.01,0.6544000148773194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,8,power_law_1.2,0.6147136211395263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,1,8,power_law_1.2,0.6377600193023681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,16,1,balanced,0.3192960023880005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,16,1,balanced,0.32497600714365643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,16,1,power_law_1.01,0.24456961154937745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,16,1,power_law_1.01,0.24685440063476563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,16,1,power_law_1.2,0.23732481002807618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,16,1,power_law_1.2,0.23957760334014894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,2,1,balanced,2.326629320780436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,2,1,balanced,2.3282453219095864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,2,1,power_law_1.01,1.7778751373291015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,2,1,power_law_1.01,1.7872575759887694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,2,1,power_law_1.2,1.7594112396240233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,2,1,power_law_1.2,1.760051155090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,4,1,balanced,1.3176159858703613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,4,1,balanced,1.3198880354563396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,4,1,power_law_1.01,1.0048192024230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,4,1,power_law_1.01,1.011359977722168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,4,1,power_law_1.2,0.997760009765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,4,1,power_law_1.2,0.9993599891662598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,8,1,balanced,0.46690134207407635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,8,1,balanced,0.46748268604278564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,8,1,power_law_1.01,0.3547327995300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,8,1,power_law_1.01,0.3608896017074585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,8,1,power_law_1.2,0.35285120010375975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,128,7168,2048,8,384,8,1,power_law_1.2,0.35599360466003416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,1,balanced,0.4496906598409017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,1,balanced,0.44994131724039715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,1,power_law_1.01,0.46456317901611327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,1,power_law_1.01,0.4660736083984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,1,power_law_1.2,0.4734015941619873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,1,power_law_1.2,0.4744448184967041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,128,balanced,0.14975466330846152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,128,balanced,0.1502400040626526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,128,power_law_1.01,0.15924479961395263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,128,power_law_1.01,0.15964800119400024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,128,power_law_1.2,0.16641279458999633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,128,power_law_1.2,0.16673920154571534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,16,balanced,0.167087992032369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,16,balanced,0.16878400246302286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,16,power_law_1.01,0.18227839469909668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,16,power_law_1.01,0.18517760038375855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,16,power_law_1.2,0.1887168049812317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,16,power_law_1.2,0.18934400081634523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,2,balanced,0.3158986568450928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,2,balanced,0.31674132744471234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,2,power_law_1.01,0.32817280292510986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,2,power_law_1.01,0.335263991355896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,2,power_law_1.2,0.33919360637664797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,2,power_law_1.2,0.35333120822906494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,32,balanced,0.15688533584276834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,32,balanced,0.15768000483512878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,32,power_law_1.01,0.1702720046043396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,32,power_law_1.01,0.1739967942237854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,32,power_law_1.2,0.17788159847259521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,32,power_law_1.2,0.18024319410324097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,4,balanced,0.23190399010976157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,4,balanced,0.23324267069498697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,4,power_law_1.01,0.2504192113876343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,4,power_law_1.01,0.25055999755859376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,4,power_law_1.2,0.2581952095031738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,4,power_law_1.2,0.27229440212249756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,64,balanced,0.15235199530919394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,64,balanced,0.15255999565124512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,64,power_law_1.01,0.16146559715270997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,64,power_law_1.01,0.16348799467086791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,64,power_law_1.2,0.16952320337295532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,64,power_law_1.2,0.17411839962005615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,8,balanced,0.18992533286412558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,8,balanced,0.19107733170191446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,8,power_law_1.01,0.20556159019470216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,8,power_law_1.01,0.20972158908843994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,8,power_law_1.2,0.21451520919799805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,1,8,power_law_1.2,0.21551361083984374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,2,1,balanced,0.2835200031598409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,2,1,balanced,0.28537599245707196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,2,1,power_law_1.01,0.28964478969573976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,2,1,power_law_1.01,0.28988161087036135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,2,1,power_law_1.2,0.2908927917480469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,2048,768,8,128,2,1,power_law_1.2,0.29253759384155276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,1,balanced,1.224725325902303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,1,balanced,1.225162665049235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,1,power_law_1.01,1.531436824798584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,1,power_law_1.01,1.532204818725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,1,power_law_1.2,1.5650879859924316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,1,power_law_1.2,1.5991552352905274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,128,balanced,0.2667679985364278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,128,balanced,0.26689066489537555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,128,power_law_1.01,0.28672640323638915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,128,power_law_1.01,0.2886591911315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,128,power_law_1.2,0.29079039096832277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,128,power_law_1.2,0.2994623899459839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,16,balanced,0.32449066638946533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,16,balanced,0.32635732491811115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,16,power_law_1.01,0.36833279132843016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,16,power_law_1.01,0.38163840770721436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,16,power_law_1.2,0.3839359998703003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,16,power_law_1.2,0.3896575927734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,2,balanced,0.7634186744689941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,2,balanced,0.7634507020314535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,2,power_law_1.01,0.903264045715332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,2,power_law_1.01,0.9098688125610351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,2,power_law_1.2,0.9568639755249023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,2,power_law_1.2,0.9606080055236816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,256,balanced,0.263045330842336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,256,balanced,0.2634986639022827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,256,power_law_1.01,0.27448320388793945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,256,power_law_1.01,0.27518720626831056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,256,power_law_1.2,0.2832256078720093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,256,power_law_1.2,0.2862528085708618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,32,balanced,0.29127999146779376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,32,balanced,0.29180800914764404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,32,power_law_1.01,0.32576000690460205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,32,power_law_1.01,0.3291968107223511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,32,power_law_1.2,0.3365504026412964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,32,power_law_1.2,0.3408639907836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,4,balanced,0.5206773281097412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,4,balanced,0.5208746592203776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,4,power_law_1.01,0.6094399929046631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,4,power_law_1.01,0.6265215873718262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,4,power_law_1.2,0.644697618484497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,4,power_law_1.2,0.6593344211578369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,64,balanced,0.2735733389854431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,64,balanced,0.27454932530721027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,64,power_law_1.01,0.30280959606170654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,64,power_law_1.01,0.30349440574645997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,64,power_law_1.2,0.3108031988143921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,64,power_law_1.2,0.3128511905670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,8,balanced,0.39047467708587646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,8,balanced,0.390613317489624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,8,power_law_1.01,0.4606527805328369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,8,power_law_1.01,0.46156158447265627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,8,power_law_1.2,0.4700160026550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,1,8,power_law_1.2,0.4703360080718994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,2,1,balanced,0.6992746988932291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,2,1,balanced,0.7015519936879476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,2,1,power_law_1.01,0.851039981842041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,2,1,power_law_1.01,0.8520256042480469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,2,1,power_law_1.2,0.8844223976135254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,2,1,power_law_1.2,0.8922559738159179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,4,1,balanced,0.439301331837972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,4,1,balanced,0.4405920108159383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,4,1,power_law_1.01,0.5228928089141845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,4,1,power_law_1.01,0.5240896224975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,4,1,power_law_1.2,0.530515193939209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,3072,1536,8,256,4,1,power_law_1.2,0.5327936172485351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,1,balanced,2.265168031056722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,1,balanced,2.265903949737549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,1,power_law_1.01,2.3403648376464843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,1,power_law_1.01,2.357529640197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,1,power_law_1.2,2.3398080825805665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,1,power_law_1.2,2.3658687591552736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,2,balanced,1.2964959939320881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,2,balanced,1.2968053023020427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,2,power_law_1.01,1.6191871643066407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,2,power_law_1.01,1.702003288269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,2,power_law_1.2,1.5523391723632813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,2,power_law_1.2,1.598585605621338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,4,balanced,0.8698240121205648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,4,balanced,0.8709440231323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,4,power_law_1.01,1.2985024452209473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,4,power_law_1.01,1.3553983688354492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,4,power_law_1.2,1.3672191619873046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,4,power_law_1.2,1.383788776397705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,8,balanced,0.6017386515935262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,8,balanced,0.6031893491744995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,8,power_law_1.01,1.16496000289917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,8,power_law_1.01,1.2015616416931152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,8,power_law_1.2,1.1954560279846191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,1,8,power_law_1.2,1.212070369720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,16,1,balanced,0.2242400050163269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,16,1,balanced,0.22635199626286825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,16,1,power_law_1.01,0.22396159172058105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,16,1,power_law_1.01,0.22734720706939698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,16,1,power_law_1.2,0.22606079578399657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,16,1,power_law_1.2,0.22700800895690917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,2,1,balanced,1.1652106444040935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,2,1,balanced,1.1653707027435303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,2,1,power_law_1.01,1.1997504234313965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,2,1,power_law_1.01,1.2079104423522948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,2,1,power_law_1.2,1.1970751762390137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,2,1,power_law_1.2,1.1991616249084474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,4,1,balanced,0.6294186512629191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,4,1,balanced,0.6320799986521403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,4,1,power_law_1.01,0.6322559833526611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,4,1,power_law_1.01,0.6483583927154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,4,1,power_law_1.2,0.6357056140899658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,4,1,power_law_1.2,0.6375936031341553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,8,1,balanced,0.3519306580225627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,8,1,balanced,0.35210132598876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,8,1,power_law_1.01,0.35452799797058104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,8,1,power_law_1.01,0.3626431941986084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,8,1,power_law_1.2,0.3545216083526611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,14336,2,8,8,1,power_law_1.2,0.35635199546813967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,1,balanced,1.386415958404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,1,balanced,1.3882346153259277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,1,power_law_1.01,1.4862144470214844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,1,power_law_1.01,1.4931584358215333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,1,power_law_1.2,1.515494441986084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,1,power_law_1.2,1.5240127563476562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,128,balanced,0.27166932821273804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,128,balanced,0.27240000168482464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,128,power_law_1.01,0.30290560722351073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,128,power_law_1.01,0.3119679927825928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,128,power_law_1.2,0.32926719188690184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,128,power_law_1.2,0.344051194190979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,16,balanced,0.3338666756947835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,16,balanced,0.3343413273493449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,16,power_law_1.01,0.39613440036773684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,16,power_law_1.01,0.3998080015182495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,16,power_law_1.2,0.4000959873199463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,16,power_law_1.2,0.4101888179779053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,2,balanced,0.8441973527272543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,2,balanced,0.8446239630381266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,2,power_law_1.01,0.9330559730529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,2,power_law_1.01,0.9625408172607421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,2,power_law_1.2,0.9375040054321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,2,power_law_1.2,0.9442496299743652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,32,balanced,0.2972000042597453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,32,balanced,0.2988106608390808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,32,power_law_1.01,0.345798397064209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,32,power_law_1.01,0.3531264066696167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,32,power_law_1.2,0.36856319904327395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,32,power_law_1.2,0.38915200233459474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,4,balanced,0.5577653249104818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,4,balanced,0.5579839944839478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,4,power_law_1.01,0.6188672065734864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,4,power_law_1.01,0.6379648208618164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,4,power_law_1.2,0.6545728206634521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,4,power_law_1.2,0.6771711826324462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,64,balanced,0.2785759965578715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,64,balanced,0.27923200527826947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,64,power_law_1.01,0.3236032009124756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,64,power_law_1.01,0.3271615982055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,64,power_law_1.2,0.35401599407196044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,64,power_law_1.2,0.35790719985961916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,8,balanced,0.41043734550476074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,8,balanced,0.41199998060862225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,8,power_law_1.01,0.48972158432006835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,8,power_law_1.01,0.49692797660827637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,8,power_law_1.2,0.48418560028076174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,1,8,power_law_1.2,0.530675220489502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,2,1,balanced,0.7964213689168295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,2,1,balanced,0.7989439964294434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,2,1,power_law_1.01,0.8275456428527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,2,1,power_law_1.01,0.8301952362060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,2,1,power_law_1.2,0.8352255821228027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,2,1,power_law_1.2,0.836729621887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,4,1,balanced,0.5003893375396729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,4,1,balanced,0.5007626612981161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,4,1,power_law_1.01,0.5090303897857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,4,1,power_law_1.01,0.5112512111663818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,4,1,power_law_1.2,0.512275218963623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,1536,8,128,4,1,power_law_1.2,0.512998390197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,1,balanced,8.72768529256185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,1,balanced,8.72922134399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,1,power_law_1.01,7.692620849609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,1,power_law_1.01,7.7259521484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,1,power_law_1.2,7.8988800048828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,1,power_law_1.2,7.926822662353516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,128,balanced,1.016650676727295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,128,balanced,1.0166773001352947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,128,power_law_1.01,1.0721343994140624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,128,power_law_1.01,1.087071990966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,128,power_law_1.2,1.1260095596313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,128,power_law_1.2,1.1343744277954102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,16,balanced,1.4529600143432617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,16,balanced,1.453759988149007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,16,power_law_1.01,1.5215231895446777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,16,power_law_1.01,1.535852813720703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,16,power_law_1.2,1.5575039863586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,16,power_law_1.2,1.5806912422180175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,2,balanced,4.877114613850911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,2,balanced,4.878224054972331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,2,power_law_1.01,4.405920028686523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,2,power_law_1.01,4.471705627441406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,2,power_law_1.2,4.650566482543946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,2,power_law_1.2,4.672505569458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,256,balanced,0.9843893051147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,256,balanced,0.9870453675587972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,256,power_law_1.01,1.043776035308838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,256,power_law_1.01,1.0520895957946776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,256,power_law_1.2,1.0800448417663575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,256,power_law_1.2,1.10316162109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,32,balanced,1.2023146947224934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,32,balanced,1.2026080290476482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,32,power_law_1.01,1.2624640464782715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,32,power_law_1.01,1.2844736099243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,32,power_law_1.2,1.3117759704589844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,32,power_law_1.2,1.3534463882446288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,4,balanced,2.9204479853312173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,4,balanced,2.9236052831014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,4,power_law_1.01,2.8075008392333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,4,power_law_1.01,2.840889549255371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,4,power_law_1.2,2.873836708068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,4,power_law_1.2,2.9431936264038088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,64,balanced,1.0751573244730632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,64,balanced,1.0810080369313557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,64,power_law_1.01,1.155628776550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,64,power_law_1.01,1.1590847969055176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,64,power_law_1.2,1.1895808219909667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,64,power_law_1.2,1.2093567848205566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,8,balanced,1.943343957265218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,8,balanced,1.9486026763916016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,8,power_law_1.01,1.9438655853271485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,8,power_law_1.01,1.9716608047485351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,8,power_law_1.2,2.0041536331176757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,4096,2688,22,512,1,8,power_law_1.2,2.037766456604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,1,balanced,3.542703946431478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,1,balanced,3.544117291768392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,1,power_law_1.01,3.810598373413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,1,power_law_1.01,3.8444862365722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,1,power_law_1.2,3.7660736083984374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,1,power_law_1.2,3.8149185180664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,2,balanced,1.9564053217569988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,2,balanced,1.9587039947509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,2,power_law_1.01,2.474803161621094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,2,power_law_1.01,2.59616641998291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,2,power_law_1.2,2.5672319412231444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,2,power_law_1.2,2.831110382080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,4,balanced,1.1770026683807373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,4,balanced,1.1780107021331787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,4,power_law_1.01,1.9854591369628907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,4,power_law_1.01,1.9956031799316407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,4,power_law_1.2,2.02096004486084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,4,power_law_1.2,2.0959871292114256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,8,balanced,0.7860853672027588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,8,balanced,0.7889706293741862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,8,power_law_1.01,1.8165056228637695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,8,power_law_1.01,1.8223936080932617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,8,power_law_1.2,1.8569343566894532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,1,8,power_law_1.2,1.876793670654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,16,1,balanced,0.322869340578715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,16,1,balanced,0.3238826592763265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,16,1,power_law_1.01,0.3278271913528442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,16,1,power_law_1.01,0.33043200969696046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,16,1,power_law_1.2,0.33000960350036623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,16,1,power_law_1.2,0.33123838901519775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,2,1,balanced,1.8081386884053547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,2,1,balanced,1.8082559903462727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,2,1,power_law_1.01,1.9173887252807618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,2,1,power_law_1.01,1.9385856628417968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,2,1,power_law_1.2,1.92806396484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,2,1,power_law_1.2,1.9362239837646484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,32,1,balanced,0.2305226723353068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,32,1,balanced,0.23079466819763184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,32,1,power_law_1.01,0.23016960620880128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,32,1,power_law_1.01,0.23534080982208253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,32,1,power_law_1.2,0.23352959156036376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,32,1,power_law_1.2,0.23582720756530762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,4,1,balanced,0.9695253372192383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,4,1,balanced,0.9702880382537842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,4,1,power_law_1.01,1.0281408309936524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,4,1,power_law_1.01,1.0317824363708497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,4,1,power_law_1.2,1.01910400390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,4,1,power_law_1.2,1.0229632377624511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,8,1,balanced,0.552016019821167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,8,1,balanced,0.5523200035095215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,8,1,power_law_1.01,0.563647985458374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,8,1,power_law_1.01,0.5687744140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,8,1,power_law_1.2,0.566323184967041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,16384,2,8,8,1,power_law_1.2,0.5681407928466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,1,balanced,2.881183942159017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,1,balanced,2.882949193318685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,1,power_law_1.01,3.6600128173828126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,1,power_law_1.01,3.712633514404297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,1,power_law_1.2,3.852889633178711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,1,power_law_1.2,3.8850494384765626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,128,balanced,0.4230026801427205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,128,balanced,0.42341868082682294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,128,power_law_1.01,0.4785151958465576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,128,power_law_1.01,0.47954559326171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,128,power_law_1.2,0.4954559803009033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,128,power_law_1.2,0.5014207839965821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,16,balanced,0.5646346807479858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,16,balanced,0.565285325050354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,16,power_law_1.01,0.6660287857055665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,16,power_law_1.01,0.683839988708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,16,power_law_1.2,0.7116864204406739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,16,power_law_1.2,0.7307648181915283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,2,balanced,1.6720479329427083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,2,balanced,1.6749547322591145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,2,power_law_1.01,2.0883199691772463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,2,power_law_1.01,2.1411264419555662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,2,power_law_1.2,2.164684867858887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,2,power_law_1.2,2.2837055206298826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,256,balanced,0.4174559911092122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,256,balanced,0.41765332221984863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,256,power_law_1.01,0.45121278762817385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,256,power_law_1.01,0.455020809173584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,256,power_law_1.2,0.4806335926055908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,256,power_law_1.2,0.4859776020050049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,32,balanced,0.48315199216206867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,32,balanced,0.48339200019836426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,32,power_law_1.01,0.5686912059783935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,32,power_law_1.01,0.5706560134887695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,32,power_law_1.2,0.596230411529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,32,power_law_1.2,0.6177472114562989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,4,balanced,1.048426628112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,4,balanced,1.048688014348348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,4,power_law_1.01,1.286297607421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,4,power_law_1.01,1.3012288093566895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,4,power_law_1.2,1.3521984100341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,4,power_law_1.2,1.355743980407715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,64,balanced,0.4399840037027995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,64,balanced,0.4412959814071655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,64,power_law_1.01,0.5113408088684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,64,power_law_1.01,0.5184768199920654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,64,power_law_1.2,0.5313727855682373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,64,power_law_1.2,0.5462592124938965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,8,balanced,0.7281973361968994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,8,balanced,0.7296053568522135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,8,power_law_1.01,0.9096447944641113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,8,power_law_1.01,0.9243583679199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,8,power_law_1.2,0.9344767570495606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,1,8,power_law_1.2,1.0300288200378418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,16,1,balanced,0.4746239980061849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,16,1,balanced,0.47486400604248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,16,1,power_law_1.01,0.5703807830810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,16,1,power_law_1.01,0.570636796951294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,16,1,power_law_1.2,0.5797440052032471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,16,1,power_law_1.2,0.5799295902252197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,2,1,balanced,1.5692159334818523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,2,1,balanced,1.5703520774841309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,2,1,power_law_1.01,1.9905471801757812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,2,1,power_law_1.01,2.010963249206543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,2,1,power_law_1.2,2.0704063415527343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,2,1,power_law_1.2,2.0854207992553713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,4,1,balanced,0.9058240254720052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,4,1,balanced,0.9071893692016602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,4,1,power_law_1.01,1.1303487777709962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,4,1,power_law_1.01,1.1355839729309083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,4,1,power_law_1.2,1.1821375846862794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,4,1,power_law_1.2,1.1850815773010255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,8,1,balanced,0.6598506768544515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,8,1,balanced,0.660154660542806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,8,1,power_law_1.01,0.7511040210723877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,8,1,power_law_1.01,0.7522751808166503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,8,1,power_law_1.2,0.7593728065490722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2048,8,256,8,1,power_law_1.2,0.760211181640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,1,balanced,3.890351931254069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,1,balanced,3.8904266357421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,1,power_law_1.01,3.6636863708496095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,1,power_law_1.01,3.6939327239990236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,1,power_law_1.2,3.7782207489013673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,1,power_law_1.2,3.779897689819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,16,balanced,0.6311839818954468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,16,balanced,0.6320426861445109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,16,power_law_1.01,0.7130112171173095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,16,power_law_1.01,0.7469120025634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,16,power_law_1.2,0.7961279869079589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,16,power_law_1.2,0.8148159980773926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,2,balanced,2.1615519523620605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,2,balanced,2.1625760396321616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,2,power_law_1.01,2.1490175247192385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,2,power_law_1.01,2.256339263916016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,2,power_law_1.2,2.1648576736450194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,2,power_law_1.2,2.2133056640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,32,balanced,0.51583464940389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,32,balanced,0.5160746574401855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,32,power_law_1.01,0.6096511840820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,32,power_law_1.01,0.617907190322876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,32,power_law_1.2,0.6616191864013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,32,power_law_1.2,0.6885312080383301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,4,balanced,1.2772213617960613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,4,balanced,1.277791976928711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,4,power_law_1.01,1.3605312347412108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,4,power_law_1.01,1.3869440078735351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,4,power_law_1.2,1.4012160301208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,4,power_law_1.2,1.456505584716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,8,balanced,0.8441387017567953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,8,balanced,0.8453280131022135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,8,power_law_1.01,0.9281279563903808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,8,power_law_1.01,0.9438976287841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,8,power_law_1.2,0.9738559722900391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,1,8,power_law_1.2,0.9992768287658691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,2,1,balanced,2.087813377380371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,2,1,balanced,2.090010643005371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,2,1,power_law_1.01,1.9983936309814454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,2,1,power_law_1.01,2.0000255584716795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,2,1,power_law_1.2,2.0332735061645506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,2,1,power_law_1.2,2.0593408584594726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,4,1,balanced,1.1599360307057698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,4,1,balanced,1.1602880160013835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,4,1,power_law_1.01,1.1280256271362306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,4,1,power_law_1.01,1.1352319717407227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,4,1,power_law_1.2,1.1445887565612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,6144,2560,8,160,4,1,power_law_1.2,1.1534655570983887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,1,balanced,3.3228321075439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,1,balanced,3.325951894124349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,1,power_law_1.01,4.244966506958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,1,power_law_1.01,4.278483200073242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,1,power_law_1.2,4.416435241699219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,1,power_law_1.2,4.446758270263672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,128,balanced,0.457045316696167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,128,balanced,0.45916799704233807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,128,power_law_1.01,0.513478422164917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,128,power_law_1.01,0.5200191974639893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,128,power_law_1.2,0.5502079963684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,128,power_law_1.2,0.5600192070007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,16,balanced,0.6236213445663452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,16,balanced,0.6247146526972452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,16,power_law_1.01,0.7703680038452149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,16,power_law_1.01,0.7760640144348144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,16,power_law_1.2,0.8119872093200684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,16,power_law_1.2,0.8333248138427735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,2,balanced,1.9184692700703938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,2,balanced,1.92031462987264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,2,power_law_1.01,2.406175994873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,2,power_law_1.01,2.4244543075561524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,2,power_law_1.2,2.5214208602905273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,2,power_law_1.2,2.614054489135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,256,balanced,0.4490346511205037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,256,balanced,0.45047998428344727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,256,power_law_1.01,0.49047040939331055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,256,power_law_1.01,0.49504637718200684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,256,power_law_1.2,0.5263487815856933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,256,power_law_1.2,0.5315711975097657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,32,balanced,0.527184009552002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,32,balanced,0.5291733344395956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,32,power_law_1.01,0.6348288059234619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,32,power_law_1.01,0.6502208232879638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,32,power_law_1.2,0.6669951915740967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,32,power_law_1.2,0.6786816120147705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,4,balanced,1.185546636581421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,4,balanced,1.1874293486277263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,4,power_law_1.01,1.5242560386657715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,4,power_law_1.01,1.5359935760498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,4,power_law_1.2,1.6223743438720704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,4,power_law_1.2,1.6418495178222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,64,balanced,0.4780106544494629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,64,balanced,0.4782239993413289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,64,power_law_1.01,0.5621376037597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,64,power_law_1.01,0.5721727848052979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,64,power_law_1.2,0.576793622970581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,64,power_law_1.2,0.5982848167419433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,8,balanced,0.8175520102183024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,8,balanced,0.8204747041066488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,8,power_law_1.01,1.0269248008728027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,8,power_law_1.01,1.0392191886901856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,8,power_law_1.2,1.0737215995788574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,1,8,power_law_1.2,1.0938688278198243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,16,1,balanced,0.5440746545791626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,16,1,balanced,0.545578678448995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,16,1,power_law_1.01,0.6547967910766601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,16,1,power_law_1.01,0.6584703922271729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,16,1,power_law_1.2,0.6662528038024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,16,1,power_law_1.2,0.6678143978118897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,2,1,balanced,1.814794699350993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,2,1,balanced,1.817098617553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,2,1,power_law_1.01,2.2947647094726564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,2,1,power_law_1.01,2.308691215515137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,2,1,power_law_1.2,2.403430366516113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,2,1,power_law_1.2,2.4314943313598634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,4,1,balanced,1.0472373167673747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,4,1,balanced,1.0472746690114338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,4,1,power_law_1.01,1.3041088104248046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,4,1,power_law_1.01,1.3241600036621093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,4,1,power_law_1.2,1.367961597442627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,4,1,power_law_1.2,1.368889617919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,8,1,balanced,0.7610026995340983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,8,1,balanced,0.7629973093668619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,8,1,power_law_1.01,0.8670016288757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,8,1,power_law_1.01,0.8687040328979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,8,1,power_law_1.2,0.8763456344604492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,256,8,1,power_law_1.2,0.8779071807861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,1,balanced,4.805791854858398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,1,balanced,4.806293487548828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,1,power_law_1.01,5.195654296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,1,power_law_1.01,5.243743896484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,1,power_law_1.2,5.414214324951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,1,power_law_1.2,5.418022537231446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,128,balanced,0.5233706633249918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,128,balanced,0.523850679397583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,128,power_law_1.01,0.5688127994537353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,128,power_law_1.01,0.5762368202209472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,128,power_law_1.2,0.5939583778381348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,128,power_law_1.2,0.6011712074279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,16,balanced,0.7676959832509359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,16,balanced,0.7696373462677002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,16,power_law_1.01,0.8231871604919434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,16,power_law_1.01,0.8567168235778808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,16,power_law_1.2,0.8914560317993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,16,power_law_1.2,0.9090304374694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,2,balanced,2.679194768269857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,2,balanced,2.680250803629557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,2,power_law_1.01,2.9186559677124024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,2,power_law_1.01,2.9759679794311524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,2,power_law_1.2,3.0011007308959963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,2,power_law_1.2,3.0511999130249023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,32,balanced,0.6309653520584106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,32,balanced,0.6326133410135905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,32,power_law_1.01,0.6923840045928955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,32,power_law_1.01,0.7104512214660644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,32,power_law_1.2,0.7355135917663574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,32,power_law_1.2,0.7372608184814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,4,balanced,1.5918879508972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,4,balanced,1.597808043162028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,4,power_law_1.01,1.7480575561523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,4,power_law_1.01,1.8234752655029296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,4,power_law_1.2,1.7474624633789062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,4,power_law_1.2,1.8268863677978515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,64,balanced,0.5550666650136312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,64,balanced,0.557370662689209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,64,power_law_1.01,0.612172794342041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,64,power_law_1.01,0.6261824131011963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,64,power_law_1.2,0.6422399997711181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,64,power_law_1.2,0.6484416007995606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,8,balanced,1.048415978749593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,8,balanced,1.0488959948221843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,8,power_law_1.01,1.1924223899841309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,8,power_law_1.01,1.1956159591674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,8,power_law_1.2,1.2357312202453614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,1,8,power_law_1.2,1.2563136100769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,16,1,balanced,0.5134773254394531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,16,1,balanced,0.5144799947738647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,16,1,power_law_1.01,0.6720767974853515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,16,1,power_law_1.01,0.6738368034362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,16,1,power_law_1.2,0.6815743923187256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,16,1,power_law_1.2,0.6846144199371338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,2,1,balanced,2.587834676106771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,2,1,balanced,2.5886665980021157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,2,1,power_law_1.01,2.821926307678223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,2,1,power_law_1.01,2.852799987792969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,2,1,power_law_1.2,2.938982391357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,2,1,power_law_1.2,2.9627904891967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,4,1,balanced,1.5235466957092285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,4,1,balanced,1.5240160624186199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,4,1,power_law_1.01,1.639967918395996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,4,1,power_law_1.01,1.6444223403930665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,4,1,power_law_1.2,1.6702592849731446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,4,1,power_law_1.2,1.6795007705688476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,8,1,balanced,0.7233813603719076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,8,1,balanced,0.72380264600118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,8,1,power_law_1.01,0.9541440010070801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,8,1,power_law_1.01,0.9598400115966796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,8,1,power_law_1.2,0.9858943939208984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,1536,7168,2048,8,384,8,1,power_law_1.2,0.9890496253967285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,1,balanced,0.1381066640218099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,1,balanced,0.13838932911554971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,1,power_law_1.01,0.08856959939002991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,1,power_law_1.01,0.09207040071487427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,1,power_law_1.2,0.08684160113334656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,1,power_law_1.2,0.08944640159606934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,128,balanced,0.03745066622893015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,128,balanced,0.03782933453718821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,128,power_law_1.01,0.03561600148677826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,128,power_law_1.01,0.036032000184059144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,128,power_law_1.2,0.035180801153182985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,16,balanced,0.037477334340413414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,16,balanced,0.039290666580200195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,16,power_law_1.01,0.036422398686408994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,16,power_law_1.01,0.03683840036392212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,16,power_law_1.2,0.036422398686408994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,16,power_law_1.2,0.03669120073318481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,2,balanced,0.09231999516487122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,2,balanced,0.09498133261998494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,2,power_law_1.01,0.06472960114479065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,2,power_law_1.01,0.06664320230484008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,2,power_law_1.2,0.06362879872322083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,2,power_law_1.2,0.06407679915428162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,32,balanced,0.035690667728583016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,32,balanced,0.03757333258787791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,32,power_law_1.01,0.03588480055332184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,32,power_law_1.01,0.03598720133304596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,32,power_law_1.2,0.0364544004201889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,32,power_law_1.2,0.036934399604797365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,4,balanced,0.06228266656398773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,4,balanced,0.06414400041103363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,4,power_law_1.01,0.05055999755859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,4,power_law_1.01,0.0521664023399353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,4,power_law_1.2,0.049318400025367734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,4,power_law_1.2,0.052300798892974856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,64,balanced,0.03570666660865148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,64,balanced,0.03754133234421412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,64,power_law_1.01,0.03531520068645477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,64,power_law_1.01,0.03566080033779144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,64,power_law_1.2,0.035180801153182985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,64,power_law_1.2,0.03617280125617981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,8,balanced,0.04472533365090688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,8,balanced,0.045834665497144066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,8,power_law_1.01,0.043782401084899905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,8,power_law_1.01,0.044531199336051944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,8,power_law_1.2,0.04267520010471344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,1,8,power_law_1.2,0.04314880073070526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,2,1,balanced,0.09796266754468282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,2,1,balanced,0.09885866443316142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,2,1,power_law_1.01,0.061504000425338747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,2,1,power_law_1.01,0.06209279894828797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,2,1,power_law_1.2,0.05916799902915955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,2048,768,8,128,2,1,power_law_1.2,0.06144639849662781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,1,balanced,0.33370665709177655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,1,balanced,0.334112008412679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,1,power_law_1.01,0.2532543897628784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,1,power_law_1.01,0.2579967975616455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,1,power_law_1.2,0.23523199558258057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,1,power_law_1.2,0.23601279258728028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,128,balanced,0.042026668787002563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,128,balanced,0.04357333481311798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,128,power_law_1.01,0.04298880100250244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,128,power_law_1.01,0.04398080110549927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,128,power_law_1.2,0.042745599150657655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,128,power_law_1.2,0.042982399463653564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,16,balanced,0.062208001812299095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,16,balanced,0.062277331948280334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,16,power_law_1.01,0.07637760043144226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,16,power_law_1.01,0.07692800164222717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,16,power_law_1.2,0.07286400198936463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,16,power_law_1.2,0.07612159848213196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,2,balanced,0.19113600254058838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,2,balanced,0.19335466623306274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,2,power_law_1.01,0.17529599666595458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,2,power_law_1.01,0.1828223943710327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,2,power_law_1.2,0.1536064028739929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,2,power_law_1.2,0.1684224009513855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,256,balanced,0.041850666205088295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,256,balanced,0.043920000394185386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,256,power_law_1.01,0.04357759952545166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,256,power_law_1.01,0.04376960098743439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,256,power_law_1.2,0.043756800889968875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,256,power_law_1.2,0.04385280013084412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,32,balanced,0.0459146648645401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,32,balanced,0.04764799773693085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,32,power_law_1.01,0.05479679703712463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,32,power_law_1.01,0.061375999450683595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,32,power_law_1.2,0.058380800485610965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,32,power_law_1.2,0.05937280058860779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,4,balanced,0.12754133343696594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,4,balanced,0.1280586620171865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,4,power_law_1.01,0.1278656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,4,power_law_1.01,0.12972160577774047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,4,power_law_1.2,0.1223296046257019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,4,power_law_1.2,0.12412159442901612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,64,balanced,0.04394133388996124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,64,balanced,0.045781334241231285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,64,power_law_1.01,0.046540799736976626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,64,power_law_1.01,0.0466048002243042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,64,power_law_1.2,0.045023998618125914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,64,power_law_1.2,0.04598399996757507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,8,balanced,0.07706666489442189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,8,balanced,0.07890666524569194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,8,power_law_1.01,0.10535039901733398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,8,power_law_1.01,0.10597759485244751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,8,power_law_1.2,0.10654720067977905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,1,8,power_law_1.2,0.10970879793167114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,2,1,balanced,0.19013333320617676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,2,1,balanced,0.1901706655820211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,2,1,power_law_1.01,0.14408960342407226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,2,1,power_law_1.01,0.1519871950149536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,2,1,power_law_1.2,0.1392832040786743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,2,1,power_law_1.2,0.13932160139083863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,4,1,balanced,0.12938132882118225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,4,1,balanced,0.12941867113113403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,4,1,power_law_1.01,0.10348800420761109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,4,1,power_law_1.01,0.103603196144104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,4,1,power_law_1.2,0.08810880184173583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,3072,1536,8,256,4,1,power_law_1.2,0.08931840062141419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,1,balanced,0.28495466709136963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,1,balanced,0.2877546747525533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,1,power_law_1.01,0.2722752094268799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,1,power_law_1.01,0.2814784049987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,1,power_law_1.2,0.28136320114135743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,1,power_law_1.2,0.2838527917861938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,2,balanced,0.20322666565577188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,2,balanced,0.20865599314371744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,2,power_law_1.01,0.1973312020301819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,2,power_law_1.01,0.1985152006149292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,2,power_law_1.2,0.19685759544372558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,2,power_law_1.2,0.19818240404129028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,4,balanced,0.14569600423177084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,4,balanced,0.14634133378664652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,4,power_law_1.01,0.1444991946220398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,4,power_law_1.01,0.14495359659194945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,4,power_law_1.2,0.14864640235900878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,4,power_law_1.2,0.1506495952606201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,8,balanced,0.12844799955685934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,8,balanced,0.1286079982916514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,8,power_law_1.01,0.12807680368423463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,8,power_law_1.01,0.1284351944923401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,8,power_law_1.2,0.12862720489501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,1,8,power_law_1.2,0.12922879457473754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,16,1,balanced,0.05143466591835022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,16,1,balanced,0.052015999952952065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,16,1,power_law_1.01,0.04862079918384552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,16,1,power_law_1.01,0.05072640180587769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,16,1,power_law_1.2,0.05014399886131286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,16,1,power_law_1.2,0.051609599590301515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,2,1,balanced,0.1602026621500651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,2,1,balanced,0.16197866201400757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,2,1,power_law_1.01,0.15794559717178344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,2,1,power_law_1.01,0.15982719659805297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,2,1,power_law_1.2,0.15740159749984742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,2,1,power_law_1.2,0.15931520462036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,4,1,balanced,0.09271466732025146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,4,1,balanced,0.10125866532325745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,4,1,power_law_1.01,0.0913919985294342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,4,1,power_law_1.01,0.09191039800643921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,4,1,power_law_1.2,0.09100160002708435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,4,1,power_law_1.2,0.09137920141220093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,8,1,balanced,0.06621333460013072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,8,1,balanced,0.06622399886449178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,8,1,power_law_1.01,0.06403840184211732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,8,1,power_law_1.01,0.0643775999546051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,8,1,power_law_1.2,0.06391680240631104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,14336,2,8,8,1,power_law_1.2,0.06435199975967407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,1,balanced,0.41881601015726727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,1,balanced,0.4190186659495036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,1,power_law_1.01,0.23065600395202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,1,power_law_1.01,0.2349695920944214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,1,power_law_1.2,0.2256319999694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,1,power_law_1.2,0.22815999984741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,128,balanced,0.0459146648645401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,128,balanced,0.047925333182017006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,128,power_law_1.01,0.04596480131149292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,128,power_law_1.01,0.0461760014295578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,128,power_law_1.2,0.045900800824165346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,128,power_law_1.2,0.04640640020370483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,16,balanced,0.07043200234572093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,16,balanced,0.07156266768773396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,16,power_law_1.01,0.0630016028881073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,16,power_law_1.01,0.06696959733963012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,16,power_law_1.2,0.060288000106811526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,16,power_law_1.2,0.06423680186271667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,2,balanced,0.23698665698369345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,2,balanced,0.2427146633466085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,2,power_law_1.01,0.15306880474090576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,2,power_law_1.01,0.15529600381851197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,2,power_law_1.2,0.14609919786453246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,2,power_law_1.2,0.14860160350799562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,32,balanced,0.05598933498064677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,32,balanced,0.056015998125076294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,32,power_law_1.01,0.053452801704406736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,32,power_law_1.01,0.0548799991607666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,32,power_law_1.2,0.05255039930343628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,32,power_law_1.2,0.05271040201187134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,4,balanced,0.14754133423169455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,4,balanced,0.15014400084813437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,4,power_law_1.01,0.10069760084152221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,4,power_law_1.01,0.10820480585098266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,4,power_law_1.2,0.10331519842147827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,4,power_law_1.2,0.11910400390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,64,balanced,0.04783466458320618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,64,balanced,0.0479360024134318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,64,power_law_1.01,0.04630399942398071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,64,power_law_1.01,0.04644480049610138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,64,power_law_1.2,0.04636160135269165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,64,power_law_1.2,0.0465472012758255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,8,balanced,0.08973333239555359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,8,balanced,0.0904853343963623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,8,power_law_1.01,0.07431039810180665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,8,power_law_1.01,0.08464000225067139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,8,power_law_1.2,0.0720192015171051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,1,8,power_law_1.2,0.0730239987373352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,2,1,balanced,0.2339786688486735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,2,1,balanced,0.23527467250823975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,2,1,power_law_1.01,0.14929920434951782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,2,1,power_law_1.01,0.15109119415283204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,2,1,power_law_1.2,0.14450559616088868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,2,1,power_law_1.2,0.14558720588684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,4,1,balanced,0.1604693333307902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,4,1,balanced,0.1606666644414266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,4,1,power_law_1.01,0.0942143976688385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,4,1,power_law_1.01,0.09520000219345093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,4,1,power_law_1.2,0.08517760038375854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,1536,8,128,4,1,power_law_1.2,0.09023360013961793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,1,balanced,1.823344071706136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,1,balanced,1.8259199460347493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,1,power_law_1.01,1.1920831680297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,1,power_law_1.01,1.2118399620056153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,1,power_law_1.2,1.0743935585021973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,1,power_law_1.2,1.0783040046691894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,128,balanced,0.07959466675917308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,128,balanced,0.08001066744327545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,128,power_law_1.01,0.07477120161056519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,128,power_law_1.01,0.07527040243148804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,128,power_law_1.2,0.07485439777374267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,128,power_law_1.2,0.07502719759941101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,16,balanced,0.19657599925994873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,16,balanced,0.19699732462565103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,16,power_law_1.01,0.21778559684753418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,16,power_law_1.01,0.22446079254150392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,16,power_law_1.2,0.21740798950195311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,16,power_law_1.2,0.22544000148773194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,2,balanced,0.9576106866200765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,2,balanced,0.9620160261789957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,2,power_law_1.01,0.6872640132904053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,2,power_law_1.01,0.7087488174438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,2,power_law_1.2,0.6337024211883545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,2,power_law_1.2,0.6826879978179932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,256,balanced,0.0636106679836909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,256,balanced,0.0664106657107671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,256,power_law_1.01,0.061612802743911746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,256,power_law_1.01,0.06416640281677247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,256,power_law_1.2,0.06550400257110596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,256,power_law_1.2,0.06636160016059875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,32,balanced,0.14499732851982117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,32,balanced,0.14718400438626608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,32,power_law_1.01,0.13628799915313722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,32,power_law_1.01,0.14453760385513306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,32,power_law_1.2,0.12483199834823608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,32,power_law_1.2,0.13749760389328003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,4,balanced,0.5234613418579102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,4,balanced,0.5244853496551514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,4,power_law_1.01,0.4237504005432129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,4,power_law_1.01,0.46562561988830564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,4,power_law_1.2,0.4552703857421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,4,power_law_1.2,0.47127041816711424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,64,balanced,0.09500267108281453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,64,balanced,0.09501866499582927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,64,power_law_1.01,0.08862720131874084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,64,power_law_1.01,0.08869760036468506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,64,power_law_1.2,0.08163840174674988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,64,power_law_1.2,0.08390399813652039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,8,balanced,0.30956266323725384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,8,balanced,0.31003199021021527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,8,power_law_1.01,0.35783679485321046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,8,power_law_1.01,0.35888640880584716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,8,power_law_1.2,0.33191680908203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,4096,2688,22,512,1,8,power_law_1.2,0.34371840953826904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,1,balanced,0.44682133197784424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,1,balanced,0.4501066605250041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,1,power_law_1.01,0.43935360908508303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,1,power_law_1.01,0.44744319915771485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,1,power_law_1.2,0.43853440284729006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,1,power_law_1.2,0.44519681930541993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,2,balanced,0.27510933081309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,2,balanced,0.3030719955762227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,2,power_law_1.01,0.2708031892776489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,2,power_law_1.01,0.2726016044616699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,2,power_law_1.2,0.268723201751709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,2,power_law_1.2,0.27167999744415283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,4,balanced,0.18863467375437418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,4,balanced,0.19141866763432822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,4,power_law_1.01,0.18793599605560302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,4,power_law_1.01,0.18812160491943358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,4,power_law_1.2,0.18731520175933838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,4,power_law_1.2,0.18804479837417604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,8,balanced,0.16055466731389365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,8,balanced,0.16191466649373373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,8,power_law_1.01,0.15955840349197387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,8,power_law_1.01,0.15976959466934204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,8,power_law_1.2,0.15961600542068483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,1,8,power_law_1.2,0.16528639793395997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,16,1,balanced,0.06993066767851512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,16,1,balanced,0.07043200234572093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,16,1,power_law_1.01,0.06707839965820313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,16,1,power_law_1.01,0.06757760047912598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,16,1,power_law_1.2,0.066975998878479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,16,1,power_law_1.2,0.06835839748382569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,2,1,balanced,0.23576533794403076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,2,1,balanced,0.23802665869394937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,2,1,power_law_1.01,0.2302464008331299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,2,1,power_law_1.01,0.23871359825134278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,2,1,power_law_1.2,0.2354111909866333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,2,1,power_law_1.2,0.23783679008483888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,32,1,balanced,0.05641066531340281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,32,1,balanced,0.05806399881839752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,32,1,power_law_1.01,0.05235840082168579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,32,1,power_law_1.01,0.05723519921302796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,32,1,power_law_1.2,0.055244797468185426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,32,1,power_law_1.2,0.05604479908943176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,4,1,balanced,0.13447999954223633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,4,1,balanced,0.16547733545303345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,4,1,power_law_1.01,0.13178240060806273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,4,1,power_law_1.01,0.13233920335769653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,4,1,power_law_1.2,0.12828799486160278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,4,1,power_law_1.2,0.1302847981452942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,8,1,balanced,0.09116799632708232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,8,1,balanced,0.09511466821034749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,8,1,power_law_1.01,0.08786560297012329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,8,1,power_law_1.01,0.08787840008735656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,8,1,power_law_1.2,0.08678399920463561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,16384,2,8,8,1,power_law_1.2,0.08725119829177856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,1,balanced,0.8060800234476725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,1,balanced,0.8079840342203776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,1,power_law_1.01,0.6244607925415039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,1,power_law_1.01,0.6393727779388427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,1,power_law_1.2,0.5661248207092285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,1,power_law_1.2,0.5687935829162598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,128,balanced,0.056143999099731445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,128,balanced,0.056559999783833824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,128,power_law_1.01,0.06135680079460144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,128,power_law_1.01,0.0654528021812439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,128,power_law_1.2,0.05909119844436646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,128,power_law_1.2,0.06502400040626526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,16,balanced,0.0981226662794749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,16,balanced,0.09914666414260864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,16,power_law_1.01,0.14229120016098024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,16,power_law_1.01,0.1435520052909851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,16,power_law_1.2,0.13449599742889404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,16,power_law_1.2,0.14045439958572387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,2,balanced,0.44021332263946533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,2,balanced,0.44207998116811115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,2,power_law_1.01,0.39673600196838377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,2,power_law_1.01,0.4051072120666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,2,power_law_1.2,0.35443840026855467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,2,power_law_1.2,0.37192959785461427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,256,balanced,0.05629333357016245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,256,balanced,0.058101331194241844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,256,power_law_1.01,0.05604479908943176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,256,power_law_1.01,0.057734400033950806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,256,power_law_1.2,0.056543999910354616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,256,power_law_1.2,0.0579584002494812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,32,balanced,0.07925333579381307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,32,balanced,0.08122133215268452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,32,power_law_1.01,0.09360640048980713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,32,power_law_1.01,0.09582719802856446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,32,power_law_1.2,0.089273601770401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,32,power_law_1.2,0.09440000057220459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,4,balanced,0.2400533358256022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,4,balanced,0.24024534225463867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,4,power_law_1.01,0.269215989112854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,4,power_law_1.01,0.29850881099700927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,4,power_law_1.2,0.24572160243988037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,4,power_law_1.2,0.28339200019836425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,64,balanced,0.06654933094978333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,64,balanced,0.0688266654809316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,64,power_law_1.01,0.0762112021446228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,64,power_law_1.01,0.07634559869766236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,64,power_law_1.2,0.07516800165176392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,64,power_law_1.2,0.07552639842033386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,8,balanced,0.14497066537539163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,8,balanced,0.14571733276049295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,8,power_law_1.01,0.20901761054992676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,8,power_law_1.01,0.2116863965988159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,8,power_law_1.2,0.22074239253997802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,1,8,power_law_1.2,0.22266879081726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,16,1,balanced,0.11103467146555583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,16,1,balanced,0.11327999830245972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,16,1,power_law_1.01,0.09571840167045594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,16,1,power_law_1.01,0.09670400023460388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,16,1,power_law_1.2,0.09300479888916016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,16,1,power_law_1.2,0.09314560294151306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,2,1,balanced,0.43117864926656085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,2,1,balanced,0.43144532044728595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,2,1,power_law_1.01,0.3338239908218384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,2,1,power_law_1.01,0.3341504096984863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,2,1,power_law_1.2,0.30695040225982667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,2,1,power_law_1.2,0.31675519943237307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,4,1,balanced,0.24283732970555624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,4,1,balanced,0.24292800823847452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,4,1,power_law_1.01,0.21063680648803712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,4,1,power_law_1.01,0.21476480960845948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,4,1,power_law_1.2,0.1958016037940979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,4,1,power_law_1.2,0.20018560886383058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,8,1,balanced,0.18541866540908813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,8,1,balanced,0.1886826753616333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,8,1,power_law_1.01,0.13397120237350463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,8,1,power_law_1.01,0.1365056037902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,8,1,power_law_1.2,0.12003840208053589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2048,8,256,8,1,power_law_1.2,0.12490240335464478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,1,balanced,0.9962560335795084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,1,balanced,0.9978773593902588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,1,power_law_1.01,0.5921664237976074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,1,power_law_1.01,0.6034495830535889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,1,power_law_1.2,0.5574207782745362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,1,power_law_1.2,0.5580671787261963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,16,balanced,0.10847466190656026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,16,balanced,0.10930132865905762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,16,power_law_1.01,0.09948800206184387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,16,power_law_1.01,0.10364799499511719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,16,power_law_1.2,0.10085120201110839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,16,power_law_1.2,0.11331199407577515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,2,balanced,0.5367946624755859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,2,balanced,0.5408533414204916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,2,power_law_1.01,0.34652159214019773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,2,power_law_1.01,0.3640575885772705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,2,power_law_1.2,0.3157439947128296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,2,power_law_1.2,0.34708480834960936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,32,balanced,0.08642133076985677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,32,balanced,0.08780800302823384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,32,power_law_1.01,0.08593279719352723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,32,power_law_1.01,0.08899840116500854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,32,power_law_1.2,0.08479359745979309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,32,power_law_1.2,0.08584319949150085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,4,balanced,0.3044106761614482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,4,balanced,0.3063093423843384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,4,power_law_1.01,0.24324479103088378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,4,power_law_1.01,0.24583039283752442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,4,power_law_1.2,0.2133631944656372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,4,power_law_1.2,0.22120320796966553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,8,balanced,0.17685866355895996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,8,balanced,0.17707733313242593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,8,power_law_1.01,0.14706560373306274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,8,power_law_1.01,0.18551039695739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,8,power_law_1.2,0.17905919551849364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,1,8,power_law_1.2,0.18259840011596679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,2,1,balanced,0.5313546657562256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,2,1,balanced,0.533456007639567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,2,1,power_law_1.01,0.32911999225616456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,2,1,power_law_1.01,0.32931840419769287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,2,1,power_law_1.2,0.3048896074295044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,2,1,power_law_1.2,0.31580801010131837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,4,1,balanced,0.3051946759223938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,4,1,balanced,0.3067413369814555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,4,1,power_law_1.01,0.20470399856567384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,4,1,power_law_1.01,0.21109120845794677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,4,1,power_law_1.2,0.1926591992378235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,6144,2560,8,160,4,1,power_law_1.2,0.19405440092086793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,1,balanced,0.933130661646525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,1,balanced,0.9377226829528809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,1,power_law_1.01,0.7326464176177978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,1,power_law_1.01,0.7451583862304687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,1,power_law_1.2,0.6338240146636963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,1,power_law_1.2,0.6480447769165039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,128,balanced,0.06058666606744131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,128,balanced,0.0642133355140686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,128,power_law_1.01,0.07109119892120361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,128,power_law_1.01,0.07185919880867005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,128,power_law_1.2,0.07046399712562561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,128,power_law_1.2,0.07220479846000671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,16,balanced,0.10751466949780782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,16,balanced,0.1076639990011851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,16,power_law_1.01,0.15789439678192138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,16,power_law_1.2,0.15764479637145995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,16,power_law_1.2,0.15807360410690308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,2,balanced,0.5055573383967081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,2,balanced,0.5064640045166016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,2,power_law_1.01,0.4182079792022705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,2,power_law_1.01,0.465177583694458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,2,power_law_1.2,0.3609920024871826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,2,power_law_1.2,0.4363711833953857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,256,balanced,0.06198399762312571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,256,balanced,0.06389333307743073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,256,power_law_1.01,0.06229119896888733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,256,power_law_1.01,0.06316800117492676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,256,power_law_1.2,0.05982080101966858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,256,power_law_1.2,0.06046720147132874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,32,balanced,0.0876693328221639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,32,balanced,0.08827199538548787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,32,power_law_1.01,0.10065280199050904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,32,power_law_1.01,0.10575360059738159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,32,power_law_1.2,0.09773439764976502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,32,power_law_1.2,0.09983360171318054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,4,balanced,0.27484800418217975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,4,balanced,0.27828800678253174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,4,power_law_1.01,0.3151616096496582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,4,power_law_1.01,0.33632640838623046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,4,power_law_1.2,0.2998719930648804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,4,power_law_1.2,0.31075201034545896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,64,balanced,0.07643199960390727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,64,balanced,0.07734400033950806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,64,power_law_1.01,0.08022400140762329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,64,power_law_1.01,0.08151040077209473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,64,power_law_1.2,0.07987840175628662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,64,power_law_1.2,0.08045439720153809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,8,balanced,0.15947733322779337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,8,balanced,0.16084800163904825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,8,power_law_1.01,0.21392641067504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,8,power_law_1.01,0.251859188079834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,8,power_law_1.2,0.242956805229187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,1,8,power_law_1.2,0.24915199279785155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,16,1,balanced,0.1256586710611979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,16,1,balanced,0.12571199735005698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,16,1,power_law_1.01,0.10711040496826171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,16,1,power_law_1.01,0.10855679512023926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,16,1,power_law_1.2,0.10215679407119752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,16,1,power_law_1.2,0.1030784010887146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,2,1,balanced,0.49853865305582684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,2,1,balanced,0.49911999702453613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,2,1,power_law_1.01,0.3833343982696533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,2,1,power_law_1.01,0.3872384071350098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,2,1,power_law_1.2,0.35662078857421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,2,1,power_law_1.2,0.35884799957275393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,4,1,balanced,0.2814720074335734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,4,1,balanced,0.2821279962857564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,4,1,power_law_1.01,0.24778239727020263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,4,1,power_law_1.01,0.24976000785827637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,4,1,power_law_1.2,0.23509759902954103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,4,1,power_law_1.2,0.23756799697875977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,8,1,balanced,0.21346133947372437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,8,1,balanced,0.2170026699701945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,8,1,power_law_1.01,0.1503167986869812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,8,1,power_law_1.01,0.15085439682006835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,8,1,power_law_1.2,0.1400704026222229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,256,8,1,power_law_1.2,0.14214400053024293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,1,balanced,0.9437493483225504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,1,balanced,0.9547200202941895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,1,power_law_1.01,0.8536576271057129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,1,power_law_1.01,0.8664575576782226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,1,power_law_1.2,0.7678336143493653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,1,power_law_1.2,0.7721856117248536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,128,balanced,0.06012799839178721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,128,balanced,0.06397333244482677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,128,power_law_1.01,0.07748479843139648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,128,power_law_1.01,0.07951359748840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,128,power_law_1.2,0.07740160226821899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,128,power_law_1.2,0.07994239926338195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,16,balanced,0.10738133390744527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,16,balanced,0.10795199871063232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,16,power_law_1.01,0.23816320896148682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,16,power_law_1.01,0.24401919841766356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,16,power_law_1.2,0.24007039070129393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,16,power_law_1.2,0.24576640129089355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,2,balanced,0.5107626517613729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,2,balanced,0.5119733413060507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,2,power_law_1.01,0.5389247894287109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,2,power_law_1.01,0.562995195388794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,2,power_law_1.2,0.5156608104705811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,2,power_law_1.2,0.5215487957000733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,32,balanced,0.08886399865150452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,32,balanced,0.08961066603660583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,32,power_law_1.01,0.13623679876327516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,32,power_law_1.01,0.13839999437332154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,32,power_law_1.2,0.13066879510879517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,32,power_law_1.2,0.1367616057395935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,4,balanced,0.27502934137980145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,4,balanced,0.2767680088678996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,4,power_law_1.01,0.3838399887084961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,4,power_law_1.01,0.38840320110321047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,4,power_law_1.2,0.3688960075378418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,4,power_law_1.2,0.38472959995269773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,64,balanced,0.07795733213424683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,64,balanced,0.07850666840871175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,64,power_law_1.01,0.09333760142326356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,64,power_law_1.01,0.09370880126953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,64,power_law_1.2,0.09185919761657715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,64,power_law_1.2,0.09388160109519958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,8,balanced,0.15892799695332846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,8,balanced,0.16158399979273477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,8,power_law_1.01,0.28287999629974364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,8,power_law_1.01,0.32102398872375487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,8,power_law_1.2,0.2798719882965088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,1,8,power_law_1.2,0.2987776041030884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,16,1,balanced,0.12428800264994304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,16,1,balanced,0.12468799948692322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,16,1,power_law_1.01,0.1139456033706665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,16,1,power_law_1.01,0.11431679725646973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,16,1,power_law_1.2,0.10806399583816528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,16,1,power_law_1.2,0.10856959819793702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,2,1,balanced,0.4965279897054036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,2,1,balanced,0.4973173141479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,2,1,power_law_1.01,0.44829440116882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,2,1,power_law_1.01,0.45821437835693357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,2,1,power_law_1.2,0.40247039794921874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,2,1,power_law_1.2,0.40595197677612305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,4,1,balanced,0.2797013322512309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,4,1,balanced,0.2804373304049174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,4,1,power_law_1.01,0.26029438972473146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,4,1,power_law_1.01,0.2629120111465454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,4,1,power_law_1.2,0.2511552095413208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,4,1,power_law_1.2,0.2533567905426025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,8,1,balanced,0.17324266831080118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,8,1,balanced,0.1755839983622233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,8,1,power_law_1.01,0.16331520080566406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,8,1,power_law_1.01,0.1642240047454834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,8,1,power_law_1.2,0.14728959798812866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16,7168,2048,8,384,8,1,power_law_1.2,0.15110399723052978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,1,balanced,0.1483466625213623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,1,balanced,0.14864533146222433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,1,power_law_1.01,0.1510975956916809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,1,power_law_1.01,0.15326720476150513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,1,power_law_1.2,0.1547968029975891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,1,power_law_1.2,0.1561792016029358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,128,balanced,0.05411200225353241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,128,balanced,0.05446400245030721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,128,power_law_1.01,0.05329279899597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,128,power_law_1.01,0.054048001766204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,128,power_law_1.2,0.05397120118141174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,128,power_law_1.2,0.054048001766204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,16,balanced,0.05996266504128774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,16,balanced,0.06195733447869619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,16,power_law_1.01,0.06039680242538452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,16,power_law_1.01,0.06046079993247986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,16,power_law_1.2,0.05982720255851746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,16,power_law_1.2,0.06117119789123535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,2,balanced,0.1425386667251587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,2,balanced,0.14403733611106873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,2,power_law_1.01,0.13857920169830323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,2,power_law_1.01,0.13886719942092896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,2,power_law_1.2,0.13936640024185182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,2,power_law_1.2,0.14083839654922486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,32,balanced,0.05783999959627787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,32,balanced,0.05871999760468801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,32,power_law_1.01,0.056934398412704465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,32,power_law_1.01,0.05699840188026428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,32,power_law_1.2,0.05687680244445801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,32,power_law_1.2,0.05753600001335144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,4,balanced,0.10255466898282369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,4,balanced,0.10409599542617798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,4,power_law_1.01,0.10061440467834473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,4,power_law_1.01,0.10087679624557495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,4,power_law_1.2,0.09745280146598816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,4,power_law_1.2,0.09831039905548096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,64,balanced,0.055573334296544395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,64,balanced,0.056688000758488975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,64,power_law_1.01,0.0536575973033905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,64,power_law_1.01,0.05454720258712768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,64,power_law_1.2,0.05451520085334778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,64,power_law_1.2,0.05484799742698669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,8,balanced,0.0695360004901886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,8,balanced,0.0721973329782486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,8,power_law_1.01,0.06990079879760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,8,power_law_1.01,0.06991999745368957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,8,power_law_1.2,0.06779519915580749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,1,8,power_law_1.2,0.06896640062332153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,2,1,balanced,0.10206933816274007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,2,1,balanced,0.10328533252080281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,2,1,power_law_1.01,0.10853760242462158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,2,1,power_law_1.01,0.10978560447692871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,2,1,power_law_1.2,0.11013120412826538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,2048,768,8,128,2,1,power_law_1.2,0.1120959997177124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,1,balanced,1.0360693136850994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,1,balanced,1.036138693491618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,1,power_law_1.01,0.8830783843994141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,1,power_law_1.01,0.8971072196960449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,1,power_law_1.2,0.8857215881347656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,1,power_law_1.2,0.8896256446838379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,128,balanced,0.10388267040252686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,128,balanced,0.10532266894976298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,128,power_law_1.01,0.10163840055465698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,128,power_law_1.01,0.10241279602050782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,128,power_law_1.2,0.10176000595092774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,128,power_law_1.2,0.10238720178604126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,16,balanced,0.16234133640925089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,16,balanced,0.16265066464742026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,16,power_law_1.01,0.15232640504837036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,16,power_law_1.01,0.15591039657592773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,16,power_law_1.2,0.15155199766159058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,16,power_law_1.2,0.15597440004348756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,2,balanced,0.5699520111083984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,2,balanced,0.5717546542485555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,2,power_law_1.01,0.48645758628845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,2,power_law_1.01,0.5015168190002441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,2,power_law_1.2,0.4905792236328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,2,power_law_1.2,0.4944255828857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,256,balanced,0.10102400183677673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,256,balanced,0.10161599516868591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,256,power_law_1.01,0.09968640208244324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,256,power_law_1.01,0.09995520114898682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,256,power_law_1.2,0.10021120309829712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,256,power_law_1.2,0.10037120580673217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,32,balanced,0.12918399771054587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,32,balanced,0.13168533643086752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,32,power_law_1.01,0.12660479545593262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,32,power_law_1.01,0.12675199508666993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,32,power_law_1.2,0.1256832003593445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,32,power_law_1.2,0.1260800004005432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,4,balanced,0.34272531668345135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,4,balanced,0.34293333689371747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,4,power_law_1.01,0.30266880989074707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,4,power_law_1.01,0.31573119163513186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,4,power_law_1.2,0.28901119232177735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,4,power_law_1.2,0.2989952087402344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,64,balanced,0.11210667093594869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,64,balanced,0.11559999982515971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,64,power_law_1.01,0.10900479555130005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,64,power_law_1.01,0.11047040224075318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,64,power_law_1.2,0.1084928035736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,64,power_law_1.2,0.11085439920425415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,8,balanced,0.22143999735514322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,8,balanced,0.22288000583648682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,8,power_law_1.01,0.20786559581756592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,8,power_law_1.01,0.2094719886779785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,8,power_law_1.2,0.20097920894622803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,1,8,power_law_1.2,0.20832641124725343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,2,1,balanced,0.5799893140792847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,2,1,balanced,0.5802186727523804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,2,1,power_law_1.01,0.4897471904754639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,2,1,power_law_1.01,0.4958335876464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,2,1,power_law_1.2,0.4884672164916992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,2,1,power_law_1.2,0.4897151947021484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,4,1,balanced,0.35199999809265137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,4,1,balanced,0.35225598017374676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,4,1,power_law_1.01,0.2999552011489868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,4,1,power_law_1.01,0.30370559692382815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,4,1,power_law_1.2,0.3009664058685303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,3072,1536,8,256,4,1,power_law_1.2,0.30227839946746826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,1,balanced,0.46820799509684247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,1,balanced,0.4684640169143677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,1,power_law_1.01,0.5919360160827637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,1,power_law_1.01,0.6244863986968994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,1,power_law_1.2,0.6144768238067627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,1,power_law_1.2,0.6237631797790527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,2,balanced,0.3394613265991211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,2,balanced,0.342682679494222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,2,power_law_1.01,0.3618367910385132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,2,power_law_1.01,0.3637248039245605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,2,power_law_1.2,0.3717504024505615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,2,power_law_1.2,0.39263999462127686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,4,balanced,0.27075199286142987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,4,balanced,0.271178662776947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,4,power_law_1.01,0.30931839942932127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,4,power_law_1.01,0.32249600887298585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,4,power_law_1.2,0.30711679458618163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,4,power_law_1.2,0.3166591882705688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,8,balanced,0.235317329565684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,8,balanced,0.23854400714238486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,8,power_law_1.01,0.2593024015426636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,8,power_law_1.01,0.2797823905944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,8,power_law_1.2,0.2778815984725952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,1,8,power_law_1.2,0.2835903882980347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,16,1,balanced,0.07796266674995422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,16,1,balanced,0.08142933249473572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,16,1,power_law_1.01,0.08181120157241821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,16,1,power_law_1.01,0.08191360235214233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,16,1,power_law_1.2,0.08202239871025085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,16,1,power_law_1.2,0.08572160005569458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,2,1,balanced,0.2661653359731038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,2,1,balanced,0.2667679985364278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,2,1,power_law_1.01,0.33994240760803224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,2,1,power_law_1.01,0.3403072118759155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,2,1,power_law_1.2,0.32912640571594237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,2,1,power_law_1.2,0.3297600030899048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,4,1,balanced,0.15293866395950317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,4,1,balanced,0.15429332852363586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,4,1,power_law_1.01,0.17902719974517822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,4,1,power_law_1.01,0.1860416054725647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,4,1,power_law_1.2,0.1911296010017395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,4,1,power_law_1.2,0.19729280471801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,8,1,balanced,0.09362666805585225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,8,1,balanced,0.0963253378868103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,8,1,power_law_1.01,0.12414079904556274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,8,1,power_law_1.01,0.12611199617385865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,8,1,power_law_1.2,0.11060479879379273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,14336,2,8,8,1,power_law_1.2,0.12645119428634644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,1,balanced,0.7134293715159098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,1,balanced,0.7140693664550781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,1,power_law_1.01,0.6687615871429443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,1,power_law_1.01,0.671289587020874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,1,power_law_1.2,0.6795519828796387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,1,power_law_1.2,0.6884928226470948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,128,balanced,0.0853653351465861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,128,balanced,0.08690667152404785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,128,power_law_1.01,0.0830847978591919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,128,power_law_1.01,0.08670079708099365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,128,power_law_1.2,0.08839679956436157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,128,power_law_1.2,0.08883839845657349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,16,balanced,0.11983999609947205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,16,balanced,0.12081600228945415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,16,power_law_1.01,0.11759999990463257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,16,power_law_1.01,0.12001919746398926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,16,power_law_1.2,0.11783679723739623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,16,power_law_1.2,0.11907839775085449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,2,balanced,0.411626656850179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,2,balanced,0.41229331493377686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,2,power_law_1.01,0.3682559967041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,2,power_law_1.01,0.3888256072998047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,2,power_law_1.2,0.4067967891693115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,2,power_law_1.2,0.40793600082397463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,32,balanced,0.10746133327484131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,32,balanced,0.10822400450706482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,32,power_law_1.01,0.10432000160217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,32,power_law_1.01,0.1055232048034668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,32,power_law_1.2,0.10734720230102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,32,power_law_1.2,0.10830080509185791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,4,balanced,0.24121065934499106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,4,balanced,0.2421600023905436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,4,power_law_1.01,0.23571839332580566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,4,power_law_1.01,0.23713281154632568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,4,power_law_1.2,0.23909759521484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,4,power_law_1.2,0.24167039394378662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,64,balanced,0.0972053309281667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,64,balanced,0.09866133332252502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,64,power_law_1.01,0.09363200068473816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,64,power_law_1.01,0.0949504017829895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,64,power_law_1.2,0.09365119934082031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,64,power_law_1.2,0.1001471996307373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,8,balanced,0.16931732495625815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,8,balanced,0.1711626648902893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,8,power_law_1.01,0.16440320014953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,8,power_law_1.01,0.1667456030845642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,8,power_law_1.2,0.1618175983428955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,1,8,power_law_1.2,0.16998399496078492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,2,1,balanced,0.24658133586247763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,2,1,balanced,0.2471146583557129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,2,1,power_law_1.01,0.2628799915313721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,2,1,power_law_1.01,0.26391680240631105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,2,1,power_law_1.2,0.264467191696167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,2,1,power_law_1.2,0.26512000560760496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,4,1,balanced,0.16474666198094687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,4,1,balanced,0.1660319964090983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,4,1,power_law_1.01,0.18499840497970582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,4,1,power_law_1.01,0.18627840280532837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,4,1,power_law_1.2,0.18554240465164185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,1536,8,128,4,1,power_law_1.2,0.1858240008354187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,1,balanced,4.480725288391113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,1,balanced,4.483797391255696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,1,power_law_1.01,3.9966720581054687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,1,power_law_1.01,4.016793441772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,1,power_law_1.2,4.053286361694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,1,power_law_1.2,4.132902526855469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,128,balanced,0.31627732515335083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,128,balanced,0.31647467613220215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,128,power_law_1.01,0.3109823942184448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,128,power_law_1.01,0.31411840915679934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,128,power_law_1.2,0.3127680063247681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,128,power_law_1.2,0.3139647960662842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,16,balanced,0.5591626564661661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,16,balanced,0.5601973136266073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,16,power_law_1.01,0.5250624179840088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,16,power_law_1.01,0.5353280067443847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,16,power_law_1.2,0.5424448013305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,16,power_law_1.2,0.549945592880249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,2,balanced,2.3957227071126304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,2,balanced,2.3969599405924478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,2,power_law_1.01,2.1339391708374023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,2,power_law_1.01,2.1910655975341795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,2,power_law_1.2,2.190265655517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,2,power_law_1.2,2.2107839584350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,256,balanced,0.29945600032806396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,256,balanced,0.2995786666870117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,256,power_law_1.01,0.2962944030761719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,256,power_law_1.01,0.2970815896987915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,256,power_law_1.2,0.29754879474639895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,256,power_law_1.2,0.29764480590820314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,32,balanced,0.4236053228378296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,32,balanced,0.42419731616973877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,32,power_law_1.01,0.41038079261779786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,32,power_law_1.01,0.41751680374145506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,32,power_law_1.2,0.40897278785705565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,32,power_law_1.2,0.4169919967651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,4,balanced,1.3501440684000652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,4,balanced,1.3517279624938965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,4,power_law_1.01,1.2330431938171387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,4,power_law_1.01,1.2402560234069824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,4,power_law_1.2,1.2462656021118164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,4,power_law_1.2,1.273203182220459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,64,balanced,0.3567359844843547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,64,balanced,0.3580160140991211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,64,power_law_1.01,0.34968318939208987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,64,power_law_1.01,0.3557568073272705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,64,power_law_1.2,0.35155839920043946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,64,power_law_1.2,0.3526144027709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,8,balanced,0.8277813593546549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,8,balanced,0.8300213019053141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,8,power_law_1.01,0.7607808113098145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,8,power_law_1.01,0.7698112010955811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,8,power_law_1.2,0.7660863876342774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,4096,2688,22,512,1,8,power_law_1.2,0.7957248210906982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,1,balanced,0.7837866942087809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,1,balanced,0.7865813573201498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,1,power_law_1.01,0.8879551887512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,1,power_law_1.01,0.9065343856811523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,1,power_law_1.2,0.87957763671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,1,power_law_1.2,0.8978367805480957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,2,balanced,0.4577813148498535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,2,balanced,0.45926932493845624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,2,power_law_1.01,0.5319615840911865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,2,power_law_1.01,0.6100927829742432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,2,power_law_1.2,0.5749504089355468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,2,power_law_1.2,0.6106048107147217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,4,balanced,0.339466651280721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,4,balanced,0.3402880032857259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,4,power_law_1.01,0.3956415891647339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,4,power_law_1.01,0.40488319396972655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,4,power_law_1.2,0.4051392078399658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,4,power_law_1.2,0.42308478355407714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,8,balanced,0.29029866059621173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,8,balanced,0.29042667150497437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,8,power_law_1.01,0.3537856101989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,8,power_law_1.01,0.3620415925979614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,8,power_law_1.2,0.3521728038787842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,1,8,power_law_1.2,0.3544447898864746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,16,1,balanced,0.1149066686630249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,16,1,balanced,0.11538133025169373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,16,1,power_law_1.01,0.11287039518356323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,16,1,power_law_1.01,0.11324800252914428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,16,1,power_law_1.2,0.11232000589370728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,16,1,power_law_1.2,0.11308799982070923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,2,1,balanced,0.43429867426554364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,2,1,balanced,0.43462932109832764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,2,1,power_law_1.01,0.4671807765960693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,2,1,power_law_1.01,0.4757631778717041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,2,1,power_law_1.2,0.46924800872802735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,2,1,power_law_1.2,0.4758272171020508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,32,1,balanced,0.09537600477536519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,32,1,balanced,0.09659199913342793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,32,1,power_law_1.01,0.09542400240898133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,32,1,power_law_1.01,0.09644160270690919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,32,1,power_law_1.2,0.09503359794616699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,32,1,power_law_1.2,0.09564800262451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,4,1,balanced,0.23677333196004233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,4,1,balanced,0.2660320003827413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,4,1,power_law_1.01,0.2723072052001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,4,1,power_law_1.01,0.27971839904785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,4,1,power_law_1.2,0.2801919937133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,4,1,power_law_1.2,0.2804608106613159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,8,1,balanced,0.1377120018005371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,8,1,balanced,0.13949333628018698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,8,1,power_law_1.01,0.17480319738388062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,8,1,power_law_1.01,0.184825599193573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,8,1,power_law_1.2,0.17550079822540282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,16384,2,8,8,1,power_law_1.2,0.18428800106048585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,1,balanced,2.5579840342203775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,1,balanced,2.559999942779541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,1,power_law_1.01,2.138790321350098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,1,power_law_1.01,2.1823680877685545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,1,power_law_1.2,2.1548992156982423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,1,power_law_1.2,2.1698175430297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,128,balanced,0.17325866222381592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,128,balanced,0.17358932892481485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,128,power_law_1.01,0.17175040245056153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,128,power_law_1.01,0.1724544048309326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,128,power_law_1.2,0.17123839855194092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,128,power_law_1.2,0.1726912021636963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,16,balanced,0.30371199051539105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,16,balanced,0.3037760059038798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,16,power_law_1.01,0.2869760036468506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,16,power_law_1.01,0.29134719371795653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,16,power_law_1.2,0.2907776117324829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,16,power_law_1.2,0.29351038932800294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,2,balanced,1.3524799346923828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,2,balanced,1.3529173533121746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,2,power_law_1.01,1.1697664260864258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,2,power_law_1.01,1.180844783782959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,2,power_law_1.2,1.1621503829956055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,2,power_law_1.2,1.1814656257629395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,256,balanced,0.1662560005982717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,256,balanced,0.16688533624013266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,256,power_law_1.01,0.16615040302276612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,256,power_law_1.01,0.1667904019355774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,256,power_law_1.2,0.16218240261077882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,256,power_law_1.2,0.1624575972557068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,32,balanced,0.22779732942581177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,32,balanced,0.22791467110315958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,32,power_law_1.01,0.2141632080078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,32,power_law_1.01,0.22277119159698486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,32,power_law_1.2,0.21964800357818604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,32,power_law_1.2,0.22287359237670898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,4,balanced,0.7593759695688883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,4,balanced,0.759984016418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,4,power_law_1.01,0.6708096027374267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,4,power_law_1.01,0.6910783767700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,4,power_law_1.2,0.6766208171844482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,4,power_law_1.2,0.6842879772186279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,64,balanced,0.1877866586049398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,64,balanced,0.18816532691319784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,64,power_law_1.01,0.18464640378952027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,64,power_law_1.01,0.1848703980445862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,64,power_law_1.2,0.1861248016357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,64,power_law_1.2,0.18655999898910522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,8,balanced,0.44990400473276776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,8,balanced,0.450981338818868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,8,power_law_1.01,0.40203518867492677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,8,power_law_1.01,0.40998401641845705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,8,power_law_1.2,0.4074880123138428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,1,8,power_law_1.2,0.43461761474609373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,16,1,balanced,0.34704001744588214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,16,1,balanced,0.34723734855651855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,16,1,power_law_1.01,0.31997439861297605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,16,1,power_law_1.01,0.32120959758758544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,16,1,power_law_1.2,0.3208064079284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,16,1,power_law_1.2,0.3244096040725708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,2,1,balanced,1.3615892728169758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,2,1,balanced,1.3635199864705403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,2,1,power_law_1.01,1.1531840324401856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,2,1,power_law_1.01,1.16627836227417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,2,1,power_law_1.2,1.1714559555053712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,2,1,power_law_1.2,1.1748543739318849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,4,1,balanced,0.46798932552337646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,4,1,balanced,0.4696640173594157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,4,1,power_law_1.01,0.41850881576538085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,4,1,power_law_1.01,0.42005119323730467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,4,1,power_law_1.2,0.4185023784637451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,4,1,power_law_1.2,0.42026238441467284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,8,1,balanced,0.2924746672312419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,8,1,balanced,0.29331199328104657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,8,1,power_law_1.01,0.2633280038833618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,8,1,power_law_1.01,0.26375041007995603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,8,1,power_law_1.2,0.2660928010940552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2048,8,256,8,1,power_law_1.2,0.2703808069229126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,1,balanced,2.0265280405680337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,1,balanced,2.026597340901693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,1,power_law_1.01,1.8641216278076171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,1,power_law_1.01,1.8708864212036134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,1,power_law_1.2,1.9105663299560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,1,power_law_1.2,1.9585216522216797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,16,balanced,0.25154133637746173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,16,balanced,0.2521226604779561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,16,power_law_1.01,0.2493824005126953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,16,power_law_1.01,0.24985599517822266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,16,power_law_1.2,0.2482815980911255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,16,power_law_1.2,0.2492288112640381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,2,balanced,1.0708853403727214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,2,balanced,1.0722453594207764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,2,power_law_1.01,1.0143936157226563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,2,power_law_1.01,1.0311552047729493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,2,power_law_1.2,1.0203583717346192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,2,power_law_1.2,1.021343994140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,32,balanced,0.18261865774790445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,32,balanced,0.18344533443450928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,32,power_law_1.01,0.18063360452651978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,32,power_law_1.01,0.18129279613494872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,32,power_law_1.2,0.18096640110015869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,32,power_law_1.2,0.18112000226974487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,4,balanced,0.43190399805704754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,4,balanced,0.43323198954264325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,4,power_law_1.01,0.40662398338317873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,4,power_law_1.01,0.4206079959869385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,4,power_law_1.2,0.4467775821685791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,4,power_law_1.2,0.4584320068359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,8,balanced,0.36393598715464276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,8,balanced,0.3657279809315999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,8,power_law_1.01,0.35393919944763186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,8,power_law_1.01,0.36355841159820557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,8,power_law_1.2,0.35475199222564696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,1,8,power_law_1.2,0.36015360355377196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,2,1,balanced,1.0747893651326497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,2,1,balanced,1.0756959915161133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,2,1,power_law_1.01,0.9787520408630371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,2,1,power_law_1.01,0.9899456024169921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,2,1,power_law_1.2,1.0039872169494628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,2,1,power_law_1.2,1.0367744445800782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,4,1,balanced,0.3655466636021932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,4,1,balanced,0.36638398965199787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,4,1,power_law_1.01,0.3650815963745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,4,1,power_law_1.01,0.3690687894821167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,4,1,power_law_1.2,0.38261120319366454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,6144,2560,8,160,4,1,power_law_1.2,0.3855423927307129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,1,balanced,2.980064074198405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,1,balanced,2.9802185694376626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,1,power_law_1.01,2.4915199279785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,1,power_law_1.01,2.513107109069824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,1,power_law_1.2,2.5074111938476564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,1,power_law_1.2,2.5156671524047853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,128,balanced,0.1970026691754659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,128,balanced,0.1970400015513102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,128,power_law_1.01,0.19482879638671874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,128,power_law_1.01,0.19489279985427857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,128,power_law_1.2,0.1950719952583313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,128,power_law_1.2,0.19619840383529663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,16,balanced,0.34093332290649414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,16,balanced,0.3413493235905965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,16,power_law_1.01,0.3193023920059204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,16,power_law_1.01,0.32025599479675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,16,power_law_1.2,0.3149888038635254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,16,power_law_1.2,0.3254848003387451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,2,balanced,1.568112055460612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,2,balanced,1.569482644399007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,2,power_law_1.01,1.3226943969726563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,2,power_law_1.01,1.3865023612976075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,2,power_law_1.2,1.3274239540100097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,2,power_law_1.2,1.3387392044067383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,256,balanced,0.18857600291570029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,256,balanced,0.18933866421381632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,256,power_law_1.01,0.1870527982711792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,256,power_law_1.01,0.18835840225219727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,256,power_law_1.2,0.18703999519348144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,256,power_law_1.2,0.18732160329818726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,32,balanced,0.2527466615041097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,32,balanced,0.2528266708056132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,32,power_law_1.01,0.23226239681243896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,32,power_law_1.01,0.24169600009918213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,32,power_law_1.2,0.23915519714355468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,32,power_law_1.2,0.24600958824157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,4,balanced,0.8740106423695883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,4,balanced,0.8743840058644613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,4,power_law_1.01,0.7834112167358398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,4,power_law_1.01,0.7945600032806397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,4,power_law_1.2,0.7810495853424072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,4,power_law_1.2,0.7883456230163575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,64,balanced,0.20877333482106528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,64,balanced,0.20891199509302774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,64,power_law_1.01,0.20391039848327636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,64,power_law_1.01,0.2057408094406128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,64,power_law_1.2,0.2071552038192749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,64,power_law_1.2,0.2074496030807495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,8,balanced,0.5161333481470743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,8,balanced,0.5181386470794678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,8,power_law_1.01,0.4388288021087646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,8,power_law_1.01,0.48535680770874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,8,power_law_1.2,0.46639361381530764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,1,8,power_law_1.2,0.49672961235046387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,16,1,balanced,0.3999573389689128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,16,1,balanced,0.40097065766652423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,16,1,power_law_1.01,0.3671679973602295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,16,1,power_law_1.01,0.36925439834594725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,16,1,power_law_1.2,0.3711103916168213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,16,1,power_law_1.2,0.37387518882751464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,2,1,balanced,1.5845120747884114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,2,1,balanced,1.5846986770629883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,2,1,power_law_1.01,1.3562303543090821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,2,1,power_law_1.01,1.3782784461975097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,2,1,power_law_1.2,1.3560576438903809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,2,1,power_law_1.2,1.3582847595214844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,4,1,balanced,0.5491946538289388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,4,1,balanced,0.551584005355835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,4,1,power_law_1.01,0.4859456062316895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,4,1,power_law_1.01,0.49793281555175783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,4,1,power_law_1.2,0.4984127998352051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,4,1,power_law_1.2,0.4987135887145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,8,1,balanced,0.3356906572977702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,8,1,balanced,0.34015464782714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,8,1,power_law_1.01,0.29872000217437744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,8,1,power_law_1.01,0.30392959117889407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,8,1,power_law_1.2,0.2953216075897217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,256,8,1,power_law_1.2,0.303436803817749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,1,balanced,4.408730824788411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,1,balanced,4.411290804545085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,1,power_law_1.01,3.3978046417236327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,1,power_law_1.01,3.4417793273925783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,1,power_law_1.2,3.3115070343017576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,1,power_law_1.2,3.3745407104492187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,128,balanced,0.24975999196370444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,128,balanced,0.2502346634864807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,128,power_law_1.01,0.24777600765228272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,128,power_law_1.01,0.24841599464416503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,128,power_law_1.2,0.2477504014968872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,128,power_law_1.2,0.24776320457458495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,16,balanced,0.48398399353027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,16,balanced,0.48403199513753253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,16,power_law_1.01,0.42426238059997556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,16,power_law_1.01,0.45299839973449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,16,power_law_1.2,0.422105598449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,16,power_law_1.2,0.4309120178222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,2,balanced,2.3070507049560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,2,balanced,2.308997313181559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,2,power_law_1.01,1.887455940246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,2,power_law_1.01,1.889241600036621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,2,power_law_1.2,1.8395584106445313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,2,power_law_1.2,1.8466432571411133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,32,balanced,0.3513866662979126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,32,balanced,0.3520053227742513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,32,power_law_1.01,0.3350271940231323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,32,power_law_1.01,0.3453439950942993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,32,power_law_1.2,0.32712318897247317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,32,power_law_1.2,0.33045120239257814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,4,balanced,1.268682638804118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,4,balanced,1.273408015569051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,4,power_law_1.01,1.0
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,4,power_law_1.01,1.102444839477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,4,power_law_1.2,0.9654911994934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,4,power_law_1.2,1.0950016021728515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,64,balanced,0.28165332476298016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,64,balanced,0.2823626597722371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,64,power_law_1.01,0.27577600479125974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,64,power_law_1.01,0.27842559814453127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,64,power_law_1.2,0.2715840101242065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,64,power_law_1.2,0.2762495994567871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,8,balanced,0.75054931640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,8,balanced,0.7512319882710775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,8,power_law_1.01,0.6287295818328857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,8,power_law_1.01,0.6694655895233155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,8,power_law_1.2,0.6186304092407227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,1,8,power_law_1.2,0.640940809249878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,16,1,balanced,0.32419200738271076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,16,1,balanced,0.3269546627998352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,16,1,power_law_1.01,0.2527551889419556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,16,1,power_law_1.01,0.26106240749359133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,16,1,power_law_1.2,0.25790719985961913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,16,1,power_law_1.2,0.27198081016540526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,2,1,balanced,2.3314186731974282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,2,1,balanced,2.3330559730529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,2,1,power_law_1.01,1.838547134399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,2,1,power_law_1.01,1.8674432754516601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,2,1,power_law_1.2,1.7941503524780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,2,1,power_law_1.2,1.8520000457763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,4,1,balanced,1.3218986988067627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,4,1,balanced,1.3255893389383953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,4,1,power_law_1.01,1.0400704383850097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,4,1,power_law_1.01,1.0556863784790038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,4,1,power_law_1.2,1.039731216430664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,4,1,power_law_1.2,1.0419391632080077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,8,1,balanced,0.4696799914042155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,8,1,balanced,0.4719253381093343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,8,1,power_law_1.01,0.3796479940414429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,8,1,power_law_1.01,0.383020806312561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,8,1,power_law_1.2,0.37879679203033445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,160,7168,2048,8,384,8,1,power_law_1.2,0.3789439916610718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,1,balanced,3.2851413091023765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,1,balanced,3.286074638366699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,1,power_law_1.01,3.1618751525878905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,1,power_law_1.01,3.1666048049926756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,1,power_law_1.2,3.1675647735595702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,1,power_law_1.2,3.169657516479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,128,balanced,1.2024479707082112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,128,balanced,1.2030346393585205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,128,power_law_1.01,1.334995174407959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,128,power_law_1.01,1.3802047729492188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,128,power_law_1.2,1.4429439544677733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,128,power_law_1.2,1.4567872047424317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,16,balanced,1.3314987023671467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,16,balanced,1.3341387112935383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,16,power_law_1.01,1.5113535881042481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,16,power_law_1.01,1.5360063552856444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,16,power_law_1.2,1.589023971557617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,16,power_law_1.2,1.7020671844482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,2,balanced,2.3463573455810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,2,balanced,2.3522987365722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,2,power_law_1.01,2.414150428771973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,2,power_law_1.01,2.4390079498291017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,2,power_law_1.2,2.4650751113891602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,2,power_law_1.2,2.493612861633301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,32,balanced,1.2587733268737793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,32,balanced,1.259717305501302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,32,power_law_1.01,1.4034367561340333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,32,power_law_1.01,1.4400511741638184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,32,power_law_1.2,1.5210111618041993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,32,power_law_1.2,1.583289623260498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,4,balanced,1.769429365793864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,4,balanced,1.769477367401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,4,power_law_1.01,1.9498304367065429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,4,power_law_1.01,1.951456069946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,4,power_law_1.2,2.004102325439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,4,power_law_1.2,2.0290687561035154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,64,balanced,1.2230239709218342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,64,balanced,1.2234453360239665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,64,power_law_1.01,1.3716544151306151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,64,power_law_1.01,1.3811776161193847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,64,power_law_1.2,1.4395392417907715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,64,power_law_1.2,1.516703987121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,8,balanced,1.4773279825846355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,8,balanced,1.4779307047526042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,8,power_law_1.01,1.6382272720336915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,8,power_law_1.01,1.6587648391723633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,8,power_law_1.2,1.8105215072631835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,1,8,power_law_1.2,1.8372735977172852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,2,1,balanced,2.000096003214518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,2,1,balanced,2.0001120567321777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,2,1,power_law_1.01,1.9813503265380858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,2,1,power_law_1.01,1.9842752456665038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,2,1,power_law_1.2,1.9818496704101562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,2048,768,8,128,2,1,power_law_1.2,1.9869312286376952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,1,balanced,8.315008163452148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,1,balanced,8.316170374552408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,1,power_law_1.01,8.264415740966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,1,power_law_1.01,8.277510070800782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,1,power_law_1.2,8.188441467285156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,1,power_law_1.2,8.222758483886718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,128,balanced,1.9941226641337078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,128,balanced,1.9948906898498535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,128,power_law_1.01,2.2167423248291014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,128,power_law_1.01,2.2762048721313475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,128,power_law_1.2,2.42224006652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,128,power_law_1.2,2.5019199371337892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,16,balanced,2.358837286631266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,16,balanced,2.359642664591471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,16,power_law_1.01,2.6869760513305665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,16,power_law_1.01,2.711052894592285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,16,power_law_1.2,2.775628852844238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,16,power_law_1.2,2.9777151107788087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,2,balanced,5.250250816345215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,2,balanced,5.2540585199991865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,2,power_law_1.01,5.4572288513183596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,2,power_law_1.01,5.719558334350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,2,power_law_1.2,5.458848190307617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,2,power_law_1.2,5.6460224151611325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,256,balanced,1.9648853937784831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,256,balanced,1.9679253896077473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,256,power_law_1.01,2.1656192779541015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,256,power_law_1.01,2.177356719970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,256,power_law_1.2,2.3596031188964846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,256,power_law_1.2,2.3704832077026365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,32,balanced,2.1524480183919272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,32,balanced,2.1534239451090493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,32,power_law_1.01,2.4440000534057615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,32,power_law_1.01,2.4682239532470702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,32,power_law_1.2,2.598297691345215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,32,power_law_1.2,2.7731903076171873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,4,balanced,3.6034825642903647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,4,balanced,3.606234550476074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,4,power_law_1.01,3.9353023529052735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,4,power_law_1.01,3.9851009368896486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,4,power_law_1.2,4.039104080200195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,4,power_law_1.2,4.225388717651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,64,balanced,2.04694398244222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,64,balanced,2.0476373036702475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,64,power_law_1.01,2.3128576278686523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,64,power_law_1.01,2.3917312622070312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,64,power_law_1.2,2.463417625427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,64,power_law_1.2,2.517625617980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,8,balanced,2.7765334447224936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,8,balanced,2.7773866653442383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,8,power_law_1.01,3.0219648361206053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,8,power_law_1.01,3.037913513183594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,8,power_law_1.2,3.1585599899291994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,1,8,power_law_1.2,3.4154624938964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,2,1,balanced,4.75761604309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,2,1,balanced,4.761269251505534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,2,1,power_law_1.01,4.693318557739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,2,1,power_law_1.01,4.70324478149414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,2,1,power_law_1.2,4.689279937744141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,2,1,power_law_1.2,4.689676666259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,4,1,balanced,2.9340108235677085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,4,1,balanced,2.9349066416422525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,4,1,power_law_1.01,2.9118783950805662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,4,1,power_law_1.01,2.91778564453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,4,1,power_law_1.2,2.9150720596313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,3072,1536,8,256,4,1,power_law_1.2,2.916556739807129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,1,balanced,21.056378682454426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,1,balanced,21.201712290445965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,1,power_law_1.01,21.514381408691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,1,power_law_1.01,21.563923645019532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,1,power_law_1.2,21.51553955078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,1,power_law_1.2,21.530712890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,2,balanced,12.235978444417318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,2,balanced,12.261685689290365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,2,power_law_1.01,15.52398681640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,2,power_law_1.01,16.11333770751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,2,power_law_1.2,14.724038696289062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,2,power_law_1.2,15.915187072753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,4,balanced,7.750176111857097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,4,balanced,7.762261072794597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,4,power_law_1.01,12.197164916992188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,4,power_law_1.01,13.76561279296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,4,power_law_1.2,13.481765747070312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,4,power_law_1.2,13.486151123046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,8,balanced,5.495754877726237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,8,balanced,5.49617067972819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,8,power_law_1.01,11.391871643066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,8,power_law_1.01,12.214163208007813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,8,power_law_1.2,11.858099365234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,1,8,power_law_1.2,12.271526336669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,16,1,balanced,1.6983359654744465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,16,1,balanced,1.7006880442301433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,16,1,power_law_1.01,1.6738367080688477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,16,1,power_law_1.01,1.674553680419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,16,1,power_law_1.2,1.6694911956787108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,16,1,power_law_1.2,1.671334457397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,2,1,balanced,10.522997538248697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,2,1,balanced,10.52501360575358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,2,1,power_law_1.01,10.649075317382813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,2,1,power_law_1.01,10.675257873535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,2,1,power_law_1.2,10.685670471191406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,2,1,power_law_1.2,10.696985626220703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,4,1,balanced,5.401082356770833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,4,1,balanced,5.406848271687825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,4,1,power_law_1.01,5.415014266967773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,4,1,power_law_1.01,5.424505615234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,4,1,power_law_1.2,5.404153442382812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,4,1,power_law_1.2,5.4119873046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,8,1,balanced,2.903285344441732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,8,1,balanced,2.9069865544637046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,8,1,power_law_1.01,2.8593727111816407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,8,1,power_law_1.01,2.8653568267822265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,8,1,power_law_1.2,2.8626752853393556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,14336,2,8,8,1,power_law_1.2,2.8674816131591796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,1,balanced,10.28110376993815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,1,balanced,10.291162490844727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,1,power_law_1.01,9.923123168945313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,1,power_law_1.01,9.926220703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,1,power_law_1.2,9.841280364990235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,1,power_law_1.2,9.863967895507812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,128,balanced,2.230064074198405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,128,balanced,2.2361653645833335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,128,power_law_1.01,2.7000896453857424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,128,power_law_1.01,2.700217628479004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,128,power_law_1.2,3.100332832336426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,128,power_law_1.2,3.1055360794067384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,16,balanced,2.6937332153320312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,16,balanced,2.698181470235189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,16,power_law_1.01,3.203308868408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,16,power_law_1.01,3.2963390350341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,16,power_law_1.2,3.655660629272461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,16,power_law_1.2,3.757593536376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,2,balanced,6.3873335520426435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,2,balanced,6.3889923095703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,2,power_law_1.01,6.765811157226563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,2,power_law_1.01,6.918982696533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,2,power_law_1.2,7.0934913635253904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,2,power_law_1.2,7.107942199707031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,32,balanced,2.4287840525309243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,32,balanced,2.4405760765075684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,32,power_law_1.01,2.9176511764526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,32,power_law_1.01,3.0784191131591796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,32,power_law_1.2,3.250636672973633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,32,power_law_1.2,3.4502464294433595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,4,balanced,4.281205177307129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,4,balanced,4.284261385599772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,4,power_law_1.01,4.852793502807617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,4,power_law_1.01,4.887583923339844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,4,power_law_1.2,5.065561676025391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,4,power_law_1.2,5.100364685058594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,64,balanced,2.298634688059489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,64,balanced,2.304207960764567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,64,power_law_1.01,2.787187194824219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,64,power_law_1.01,2.8127487182617186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,64,power_law_1.2,3.086489677429199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,64,power_law_1.2,3.1627519607543944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,8,balanced,3.226463953653971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,8,balanced,3.229717254638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,8,power_law_1.01,3.8135616302490236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,8,power_law_1.01,3.8811904907226564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,8,power_law_1.2,4.409747314453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,1,8,power_law_1.2,4.562073516845703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,2,1,balanced,5.850538889567058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,2,1,balanced,5.857061386108398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,2,1,power_law_1.01,5.56682243347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,2,1,power_law_1.01,5.574297714233398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,2,1,power_law_1.2,5.5655872344970705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,2,1,power_law_1.2,5.571654510498047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,4,1,balanced,3.5781119664510093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,4,1,balanced,3.5798721313476562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,4,1,power_law_1.01,3.5216384887695313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,4,1,power_law_1.01,3.536441421508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,4,1,power_law_1.2,3.518483352661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,1536,8,128,4,1,power_law_1.2,3.5209983825683593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,1,balanced,47.4399668375651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,1,balanced,47.4540761311849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,1,power_law_1.01,47.49982604980469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,1,power_law_1.01,47.51786804199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,1,power_law_1.2,46.84101867675781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,1,power_law_1.2,46.961676025390624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,128,balanced,8.40179189046224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,128,balanced,8.403760274251303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,128,power_law_1.01,9.33356170654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,128,power_law_1.01,9.491776275634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,128,power_law_1.2,10.139878082275391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,128,power_law_1.2,10.330451202392577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,16,balanced,10.617669423421225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,16,balanced,10.63641611735026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,16,power_law_1.01,11.960569763183594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,16,power_law_1.01,12.189926147460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,16,power_law_1.2,12.894117736816407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,16,power_law_1.2,13.417996215820313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,2,balanced,28.18762715657552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,2,balanced,28.190256754557293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,2,power_law_1.01,28.940524291992187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,2,power_law_1.01,30.1
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,2,power_law_1.2,29.890484619140626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,2,power_law_1.2,31.240017700195313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,256,balanced,8.234432220458984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,256,balanced,8.262783686319986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,256,power_law_1.01,9.098892974853516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,256,power_law_1.01,9.110540771484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,256,power_law_1.2,10.134329223632813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,256,power_law_1.2,9.741260528564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,32,balanced,9.348762512207031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,32,balanced,9.351066589355469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,32,power_law_1.01,10.73367691040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,32,power_law_1.01,10.761280059814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,32,power_law_1.2,11.448441314697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,32,power_law_1.2,11.8089599609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,4,balanced,18.172138214111328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,4,balanced,18.18230438232422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,4,power_law_1.01,19.532115173339843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,4,power_law_1.01,19.7482177734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,4,power_law_1.2,20.148570251464843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,4,power_law_1.2,20.66334686279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,64,balanced,8.714864095052084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,64,balanced,8.748485565185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,64,power_law_1.01,9.781791687011719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,64,power_law_1.01,9.876012420654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,64,power_law_1.2,10.372102355957031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,64,power_law_1.2,10.571769714355469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,8,balanced,13.157343546549479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,8,balanced,13.189125061035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,8,power_law_1.01,14.611769104003907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,8,power_law_1.01,15.222099304199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,8,power_law_1.2,15.394720458984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,4096,2688,22,512,1,8,power_law_1.2,15.549580383300782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,1,balanced,34.41863505045573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,1,balanced,34.47250111897787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,1,power_law_1.01,34.76744384765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,1,power_law_1.01,34.811865234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,1,power_law_1.2,34.73829650878906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,1,power_law_1.2,34.803994750976564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,2,balanced,19.126047770182293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,2,balanced,19.129348754882812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,2,power_law_1.01,25.589517211914064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,2,power_law_1.01,30.365158081054688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,2,power_law_1.2,23.257369995117188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,2,power_law_1.2,23.87291564941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,4,balanced,11.459184010823568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,4,balanced,11.465834299723307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,4,power_law_1.01,19.697727966308594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,4,power_law_1.01,20.608793640136717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,4,power_law_1.2,21.252230834960937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,4,power_law_1.2,21.30437774658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,8,balanced,7.617685317993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,8,balanced,7.622346878051758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,8,power_law_1.01,18.963046264648437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,8,power_law_1.01,19.116517639160158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,8,power_law_1.2,18.15894470214844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,1,8,power_law_1.2,18.963487243652345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,16,1,balanced,2.666149298350016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,16,1,balanced,2.6667467753092446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,16,1,power_law_1.01,2.622233581542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,16,1,power_law_1.01,2.6222463607788087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,16,1,power_law_1.2,2.6209535598754883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,16,1,power_law_1.2,2.622611236572266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,2,1,balanced,17.09159978230794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,2,1,balanced,17.121754964192707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,2,1,power_law_1.01,17.311538696289062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,2,1,power_law_1.01,17.32289276123047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,2,1,power_law_1.2,17.319398498535158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,2,1,power_law_1.2,17.358963012695312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,32,1,balanced,1.6958880424499512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,32,1,balanced,1.6958986918131511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,32,1,power_law_1.01,1.6648191452026366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,32,1,power_law_1.01,1.6680448532104493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,32,1,power_law_1.2,1.6641855239868164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,32,1,power_law_1.2,1.6711040496826173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,4,1,balanced,8.844751993815104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,4,1,balanced,8.850992202758789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,4,1,power_law_1.01,8.955903625488281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,4,1,power_law_1.01,8.970937347412109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,4,1,power_law_1.2,8.938495635986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,4,1,power_law_1.2,8.951731109619141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,8,1,balanced,4.677365303039551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,8,1,balanced,4.68609078725179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,8,1,power_law_1.01,4.679084777832031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,8,1,power_law_1.01,4.690348815917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,8,1,power_law_1.2,4.689497756958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,16384,2,8,8,1,power_law_1.2,4.694060897827148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,1,balanced,19.482554117838543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,1,balanced,19.486602783203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,1,power_law_1.01,20.136607360839843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,1,power_law_1.01,20.160121154785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,1,power_law_1.2,19.975584411621092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,1,power_law_1.2,20.007225036621094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,128,balanced,3.1918506622314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,128,balanced,3.2016798655192056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,128,power_law_1.01,3.801068878173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,128,power_law_1.01,3.8830718994140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,128,power_law_1.2,4.358303833007812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,128,power_law_1.2,4.615091323852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,16,balanced,4.124160130818685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,16,balanced,4.142421404520671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,16,power_law_1.01,4.939897537231445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,16,power_law_1.01,4.986329650878906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,16,power_law_1.2,5.676300811767578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,16,power_law_1.2,5.819769668579101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,2,balanced,11.516063690185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,2,balanced,11.519371032714844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,2,power_law_1.01,12.225753784179688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,2,power_law_1.01,13.259698486328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,2,power_law_1.2,12.511449432373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,2,power_law_1.2,12.698169708251953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,256,balanced,3.126293182373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,256,balanced,3.1280800501505532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,256,power_law_1.01,3.6141311645507814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,256,power_law_1.01,3.6227455139160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,256,power_law_1.2,4.255302429199219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,256,power_law_1.2,4.343833541870117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,32,balanced,3.598613421122233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,32,balanced,3.598965326944987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,32,power_law_1.01,4.3685760498046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,32,power_law_1.01,4.4786113739013675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,32,power_law_1.2,4.829254531860352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,32,power_law_1.2,4.940499114990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,4,balanced,7.312735875447591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,4,balanced,7.325471878051758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,4,power_law_1.01,8.459744262695313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,4,power_law_1.01,9.052748870849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,4,power_law_1.2,8.403916931152343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,4,power_law_1.2,8.725593566894531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,64,balanced,3.330890655517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,64,balanced,3.3362134297688804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,64,power_law_1.01,4.1341503143310545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,64,power_law_1.01,4.1352191925048825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,64,power_law_1.2,4.720064163208008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,64,power_law_1.2,4.7417854309082035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,8,balanced,4.895663897196452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,8,balanced,4.898367881774902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,8,power_law_1.01,6.01440658569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,8,power_law_1.01,6.228761672973633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,8,power_law_1.2,6.316831970214844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,1,8,power_law_1.2,6.790815734863282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,16,1,balanced,3.271365483601888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,16,1,balanced,3.2725547154744468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,16,1,power_law_1.01,3.313484954833984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,16,1,power_law_1.01,3.3167423248291015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,16,1,power_law_1.2,3.3246654510498046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,16,1,power_law_1.2,3.3376129150390623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,2,1,balanced,10.738875071207682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,2,1,balanced,10.74569574991862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,2,1,power_law_1.01,10.87570571899414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,2,1,power_law_1.01,10.881446075439452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,2,1,power_law_1.2,10.72735366821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,2,1,power_law_1.2,10.758681488037109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,4,1,balanced,6.146954854329427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,4,1,balanced,6.148431777954102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,4,1,power_law_1.01,6.411705780029297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,4,1,power_law_1.01,6.411955261230469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,4,1,power_law_1.2,6.441407775878906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,4,1,power_law_1.2,6.443360137939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,8,1,balanced,8.555322647094727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,8,1,balanced,8.557402928670248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,8,1,power_law_1.01,8.657305908203124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,8,1,power_law_1.01,8.671186828613282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,8,1,power_law_1.2,8.696038055419923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2048,8,256,8,1,power_law_1.2,8.700083160400391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,1,balanced,23.891306559244793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,1,balanced,23.914756774902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,1,power_law_1.01,23.73326721191406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,1,power_law_1.01,23.73838653564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,1,power_law_1.2,23.55303039550781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,1,power_law_1.2,23.610202026367187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,16,balanced,4.714357376098633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,16,balanced,4.722336133321126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,16,power_law_1.01,6.185651016235352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,16,power_law_1.01,6.533395385742187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,16,power_law_1.2,6.66522216796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,16,power_law_1.2,7.0894721984863285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,2,balanced,13.88584009806315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,2,balanced,13.88696034749349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,2,power_law_1.01,14.446694946289062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,2,power_law_1.01,14.877159118652344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,2,power_law_1.2,14.85440673828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,2,power_law_1.2,16.357318115234374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,32,balanced,4.043642679850261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,32,balanced,4.046501477559407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,32,power_law_1.01,5.347200012207031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,32,power_law_1.01,6.302201461791992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,32,power_law_1.2,6.082022476196289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,32,power_law_1.2,6.2965953826904295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,4,balanced,8.273658752441406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,4,balanced,8.275418599446615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,4,power_law_1.01,10.309587097167968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,4,power_law_1.01,10.34136962890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,4,power_law_1.2,10.767072296142578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,4,power_law_1.2,10.787916564941407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,8,balanced,5.815392176310222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,8,balanced,5.817056020100911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,8,power_law_1.01,7.327833557128907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,8,power_law_1.01,7.688294219970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,8,power_law_1.2,8.681491088867187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,1,8,power_law_1.2,9.46740493774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,2,1,balanced,12.906959533691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,2,1,balanced,12.908138275146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,2,1,power_law_1.01,12.600012969970702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,2,1,power_law_1.01,12.608102416992187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,2,1,power_law_1.2,12.462534332275391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,2,1,power_law_1.2,12.493638610839843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,4,1,balanced,7.237514495849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,4,1,balanced,7.24128532409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,4,1,power_law_1.01,7.1521858215332035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,4,1,power_law_1.01,7.1676483154296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,4,1,power_law_1.2,7.160915374755859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,6144,2560,8,160,4,1,power_law_1.2,7.1684417724609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,1,balanced,22.45183563232422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,1,balanced,22.465370178222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,1,power_law_1.01,23.316864013671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,1,power_law_1.01,23.331634521484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,1,power_law_1.2,23.192723083496094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,1,power_law_1.2,23.212384033203126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,128,balanced,3.4644638697306314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,128,balanced,3.4699840545654297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,128,power_law_1.01,4.294047927856445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,128,power_law_1.01,4.314822387695313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,128,power_law_1.2,5.036352157592773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,128,power_law_1.2,5.31383056640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,16,balanced,4.562645276387532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,16,balanced,4.563285191853841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,16,power_law_1.01,5.590995025634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,16,power_law_1.01,5.831257629394531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,16,power_law_1.2,6.233401489257813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,16,power_law_1.2,7.122195434570313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,2,balanced,13.174560546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,2,balanced,13.199092864990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,2,power_law_1.01,14.551097106933593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,2,power_law_1.01,14.551808166503907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,2,power_law_1.2,14.462669372558594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,2,power_law_1.2,15.180928039550782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,256,balanced,3.3849865595499673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,256,balanced,3.390181223551432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,256,power_law_1.01,3.9721664428710937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,256,power_law_1.01,4.037740707397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,256,power_law_1.2,4.709363174438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,256,power_law_1.2,4.770732879638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,32,balanced,3.94162654876709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,32,balanced,3.9430131912231445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,32,power_law_1.01,4.765407943725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,32,power_law_1.01,4.975027084350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,32,power_law_1.2,5.501171112060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,32,power_law_1.2,5.6666816711425785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,4,balanced,8.27291170756022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,4,balanced,8.283962885538736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,4,power_law_1.01,9.396966552734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,4,power_law_1.01,9.572621154785157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,4,power_law_1.2,10.693260955810548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,4,power_law_1.2,9.871424102783203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,64,balanced,3.6254399617513022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,64,balanced,3.635845184326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,64,power_law_1.01,4.530387115478516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,64,power_law_1.01,4.674399948120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,64,power_law_1.2,5.101177597045899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,64,power_law_1.2,5.1630912780761715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,8,balanced,5.516730626424153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,8,balanced,5.521626790364583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,8,power_law_1.01,6.702310180664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,8,power_law_1.01,6.807321929931641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,8,power_law_1.2,7.902342224121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,1,8,power_law_1.2,8.204351806640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,16,1,balanced,3.7695465087890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,16,1,balanced,3.773530642191569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,16,1,power_law_1.01,3.836640167236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,16,1,power_law_1.01,3.845337677001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,16,1,power_law_1.2,3.876844787597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,16,1,power_law_1.2,3.8768768310546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,2,1,balanced,12.430213928222656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,2,1,balanced,12.446698506673178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,2,1,power_law_1.01,12.62693099975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,2,1,power_law_1.01,12.639405059814454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,2,1,power_law_1.2,12.472390747070312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,2,1,power_law_1.2,12.50929946899414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,4,1,balanced,7.093461354573567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,4,1,balanced,7.0967254638671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,4,1,power_law_1.01,7.357574462890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,4,1,power_law_1.01,7.377798461914063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,4,1,power_law_1.2,7.39697265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,4,1,power_law_1.2,7.425395202636719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,8,1,balanced,9.942997614542643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,8,1,balanced,9.957738876342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,8,1,power_law_1.01,10.071705627441407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,8,1,power_law_1.01,10.085164642333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,8,1,power_law_1.2,10.10552978515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,256,8,1,power_law_1.2,10.108582305908204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,1,balanced,25.142799377441406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,1,balanced,25.159156799316406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,1,power_law_1.01,24.402053833007812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,1,power_law_1.01,24.46112060546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,1,power_law_1.2,24.472557067871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,1,power_law_1.2,24.545843505859374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,128,balanced,3.5439891815185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,128,balanced,3.5488640467325845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,128,power_law_1.01,4.169068908691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,128,power_law_1.01,4.2417854309082035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,128,power_law_1.2,4.474240112304687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,128,power_law_1.2,4.784051132202149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,16,balanced,4.771610577901204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,16,balanced,4.777983983357747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,16,power_law_1.01,5.674105453491211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,16,power_law_1.01,5.79246711730957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,16,power_law_1.2,6.704351806640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,16,power_law_1.2,6.846828460693359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,2,balanced,14.53268814086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,2,balanced,14.543200174967447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,2,power_law_1.01,14.827655029296874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,2,power_law_1.01,15.516755676269531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,2,power_law_1.2,14.876422119140624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,2,power_law_1.2,15.706405639648438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,32,balanced,4.078250567118327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,32,balanced,4.078346570332845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,32,power_law_1.01,4.758291244506836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,32,power_law_1.01,4.978444671630859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,32,power_law_1.2,5.253657531738281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,32,power_law_1.2,5.313785552978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,4,balanced,8.970736185709635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,4,balanced,8.99501864115397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,4,power_law_1.01,10.104045104980468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,4,power_law_1.01,9.563699340820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,4,power_law_1.2,10.038054656982421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,4,power_law_1.2,10.058150482177734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,64,balanced,3.716869354248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,64,balanced,3.722506523132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,64,power_law_1.01,4.39428482055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,64,power_law_1.01,4.475660705566407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,64,power_law_1.2,4.773292922973633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,64,power_law_1.2,4.908377456665039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,8,balanced,6.184672037760417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,8,balanced,6.188165028889974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,8,power_law_1.01,6.940447998046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,8,power_law_1.01,7.028755187988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,8,power_law_1.2,7.296498870849609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,1,8,power_law_1.2,7.494636535644531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,16,1,balanced,4.654826800028483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,16,1,balanced,4.660928090413411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,16,1,power_law_1.01,4.76769905090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,16,1,power_law_1.01,4.778195190429687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,16,1,power_law_1.2,4.807340621948242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,16,1,power_law_1.2,4.823187255859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,2,1,balanced,13.801514943440756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,2,1,balanced,13.802970886230469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,2,1,power_law_1.01,13.315699768066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,2,1,power_law_1.01,13.350111389160157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,2,1,power_law_1.2,13.249734497070312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,2,1,power_law_1.2,13.280288696289062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,4,1,balanced,8.194986979166666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,4,1,balanced,8.197258631388346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,4,1,power_law_1.01,7.781433868408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,4,1,power_law_1.01,7.7928321838378904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,4,1,power_law_1.2,7.786630249023437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,4,1,power_law_1.2,7.79254379272461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,8,1,balanced,5.338986714680989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,8,1,balanced,5.342997233072917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,8,1,power_law_1.01,5.165139389038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,8,1,power_law_1.01,5.180614471435547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,8,1,power_law_1.2,5.185875320434571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,16384,7168,2048,8,384,8,1,power_law_1.2,5.189427185058594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,1,balanced,0.14825600385665894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,1,balanced,0.15035733580589294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,1,power_law_1.01,0.15735039710998536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,1,power_law_1.01,0.15872000455856322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,1,power_law_1.2,0.15897599458694459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,1,power_law_1.2,0.1597440004348755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,128,balanced,0.05481066803137461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,128,balanced,0.0562666654586792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,128,power_law_1.01,0.055078399181365964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,128,power_law_1.01,0.05571200251579285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,128,power_law_1.2,0.05532159805297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,128,power_law_1.2,0.055820798873901366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,16,balanced,0.06162666777769724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,16,balanced,0.06249066690603892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,16,power_law_1.01,0.06224640011787415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,16,power_law_1.01,0.06286720037460328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,16,power_law_1.2,0.06094719767570496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,16,power_law_1.2,0.0616703987121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,2,balanced,0.14455999930699667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,2,balanced,0.14470932881037393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,2,power_law_1.01,0.14046080112457277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,2,power_law_1.01,0.14120320081710816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,2,power_law_1.2,0.1414720058441162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,2,power_law_1.2,0.14716800451278686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,32,balanced,0.05825066566467285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,32,balanced,0.0587360014518102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,32,power_law_1.01,0.057817602157592775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,32,power_law_1.01,0.05804799795150757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,32,power_law_1.2,0.05807999968528747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,32,power_law_1.2,0.05899519920349121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,4,balanced,0.10466667016347249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,4,balanced,0.10493333141009013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,4,power_law_1.01,0.10243840217590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,4,power_law_1.01,0.10347520112991333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,4,power_law_1.2,0.10423040390014648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,4,power_law_1.2,0.10592000484466553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,64,balanced,0.05412266651789347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,64,balanced,0.05490666627883911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,64,power_law_1.01,0.05538560152053833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,64,power_law_1.01,0.057196801900863646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,64,power_law_1.2,0.05688959956169128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,64,power_law_1.2,0.05787519812583923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,8,balanced,0.07127466797828674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,8,balanced,0.07249066730340321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,8,power_law_1.01,0.070387202501297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,8,power_law_1.01,0.07071999907493591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,8,power_law_1.2,0.06941440105438232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,1,8,power_law_1.2,0.06999040246009827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,2,1,balanced,0.10345066587130229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,2,1,balanced,0.10402133067448933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,2,1,power_law_1.01,0.115174400806427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,2,1,power_law_1.01,0.1165887951850891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,2,1,power_law_1.2,0.11391999721527099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,2048,768,8,128,2,1,power_law_1.2,0.11662080287933349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,1,balanced,1.043386697769165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,1,balanced,1.0436000029246013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,1,power_law_1.01,0.8924032211303711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,1,power_law_1.01,0.9102208137512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,1,power_law_1.2,0.8779328346252442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,1,power_law_1.2,0.8934975624084472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,128,balanced,0.10645866394042969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,128,balanced,0.10705600182215373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,128,power_law_1.01,0.10519039630889893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,128,power_law_1.01,0.10537600517272949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,128,power_law_1.2,0.10554239749908448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,128,power_law_1.2,0.10575360059738159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,16,balanced,0.16432000199953714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,16,balanced,0.16495999693870544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,16,power_law_1.01,0.15886720418930053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,16,power_law_1.01,0.15892479419708253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,16,power_law_1.2,0.15913599729537964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,16,power_law_1.2,0.1595136046409607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,2,balanced,0.5758613348007202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,2,balanced,0.5774346590042114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,2,power_law_1.01,0.5181248188018799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,2,power_law_1.01,0.5188096046447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,2,power_law_1.2,0.499948787689209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,2,power_law_1.2,0.5075456142425537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,256,balanced,0.1051093339920044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,256,balanced,0.1053653359413147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,256,power_law_1.01,0.10285439491271972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,256,power_law_1.01,0.10340479612350464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,256,power_law_1.2,0.10342400074005127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,256,power_law_1.2,0.10362880229949951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,32,balanced,0.13159466783205667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,32,balanced,0.13421333829561868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,32,power_law_1.01,0.12940800189971924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,32,power_law_1.01,0.13040640354156494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,32,power_law_1.2,0.12865920066833497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,32,power_law_1.2,0.13007359504699706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,4,balanced,0.34488534927368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,4,balanced,0.3458186785380046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,4,power_law_1.01,0.3089792013168335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,4,power_law_1.01,0.32160000801086425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,4,power_law_1.2,0.31320960521698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,4,power_law_1.2,0.3243904113769531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,64,balanced,0.11563733220100403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,64,balanced,0.11683733264605205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,64,power_law_1.01,0.11230080127716065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,64,power_law_1.01,0.11488640308380127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,64,power_law_1.2,0.11114879846572875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,64,power_law_1.2,0.11344640254974366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,8,balanced,0.22576000293095908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,8,balanced,0.22609599431355795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,8,power_law_1.01,0.21146879196166993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,8,power_law_1.01,0.21425280570983887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,8,power_law_1.2,0.20307838916778564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,1,8,power_law_1.2,0.2128767967224121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,2,1,balanced,0.5816906690597534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,2,1,balanced,0.5822986761728922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,2,1,power_law_1.01,0.5049344062805176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,2,1,power_law_1.01,0.5145023822784424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,2,1,power_law_1.2,0.4938176155090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,2,1,power_law_1.2,0.505567979812622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,4,1,balanced,0.3526080052057902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,4,1,balanced,0.3535199960072835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,4,1,power_law_1.01,0.30423679351806643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,4,1,power_law_1.01,0.30538239479064944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,4,1,power_law_1.2,0.3061376094818115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,3072,1536,8,256,4,1,power_law_1.2,0.30680320262908933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,1,balanced,0.4757546583811442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,1,balanced,0.47631998856862384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,1,power_law_1.01,0.6003071784973144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,1,power_law_1.01,0.6477375984191894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,1,power_law_1.2,0.6486015796661377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,1,power_law_1.2,0.6553408145904541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,2,balanced,0.3458826541900635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,2,balanced,0.34623467922210693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,2,power_law_1.01,0.386406397819519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,2,power_law_1.01,0.3996864080429077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,2,power_law_1.2,0.3919872045516968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,2,power_law_1.2,0.4041088104248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,4,balanced,0.2765173316001892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,4,balanced,0.27673067649205524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,4,power_law_1.01,0.31692800521850584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,4,power_law_1.01,0.32780799865722654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,4,power_law_1.2,0.3330048084259033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,4,power_law_1.2,0.33571200370788573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,8,balanced,0.24196799596150717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,8,balanced,0.24305067459742227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,8,power_law_1.01,0.28378241062164306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,8,power_law_1.01,0.2962559938430786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,8,power_law_1.2,0.27809278964996337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,1,8,power_law_1.2,0.2908992052078247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,16,1,balanced,0.08063466846942902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,16,1,balanced,0.08080533146858215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,16,1,power_law_1.01,0.08298239707946778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,16,1,power_law_1.01,0.08519039750099182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,16,1,power_law_1.2,0.08629760146141052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,16,1,power_law_1.2,0.08938239812850952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,2,1,balanced,0.2722559968630473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,2,1,balanced,0.2732800046602885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,2,1,power_law_1.01,0.34586238861083984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,2,1,power_law_1.01,0.3497215986251831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,2,1,power_law_1.2,0.3498879909515381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,2,1,power_law_1.2,0.3504575967788696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,4,1,balanced,0.15656532843907675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,4,1,balanced,0.1567306617895762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,4,1,power_law_1.01,0.2067392110824585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,4,1,power_law_1.01,0.21060481071472167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,4,1,power_law_1.2,0.19946880340576173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,4,1,power_law_1.2,0.20549120903015136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,8,1,balanced,0.09547199805577596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,8,1,balanced,0.09903466701507568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,8,1,power_law_1.01,0.13473279476165773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,8,1,power_law_1.01,0.14076160192489623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,8,1,power_law_1.2,0.12856320142745972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,14336,2,8,8,1,power_law_1.2,0.13471360206604005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,1,balanced,0.7197226683298746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,1,balanced,0.7203786373138428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,1,power_law_1.01,0.6823232173919678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,1,power_law_1.01,0.6871424198150635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,1,power_law_1.2,0.7063231945037842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,1,power_law_1.2,0.71244797706604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,128,balanced,0.08858666817347209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,128,balanced,0.09220266342163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,128,power_law_1.01,0.08910080194473266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,128,power_law_1.01,0.09171199798583984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,128,power_law_1.2,0.0939199984073639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,128,power_law_1.2,0.0946943998336792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,16,balanced,0.1258080005645752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,16,balanced,0.12613866726557413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,16,power_law_1.01,0.12273279428482056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,16,power_law_1.01,0.1233407974243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,16,power_law_1.2,0.12317440509796143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,16,power_law_1.2,0.12440320253372192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,2,balanced,0.4166773160298665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,2,balanced,0.418506662050883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,2,power_law_1.01,0.3852799892425537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,2,power_law_1.01,0.3861567974090576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,2,power_law_1.2,0.4131584167480469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,2,power_law_1.2,0.41756157875061034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,32,balanced,0.1116426686445872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,32,balanced,0.11300266782442729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,32,power_law_1.01,0.11156480312347412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,32,power_law_1.01,0.11176320314407348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,32,power_law_1.2,0.11295360326766968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,32,power_law_1.2,0.11352959871292115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,4,balanced,0.24588799476623535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,4,balanced,0.24604799350102743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,4,power_law_1.01,0.2437056064605713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,4,power_law_1.01,0.2458240032196045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,4,power_law_1.2,0.2463167905807495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,4,power_law_1.2,0.2499840021133423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,64,balanced,0.1014400025208791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,64,balanced,0.10254933436711629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,64,power_law_1.01,0.10096640586853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,64,power_law_1.01,0.10442880392074586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,64,power_law_1.2,0.10325119495391846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,64,power_law_1.2,0.10559359788894654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,8,balanced,0.1744426687558492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,8,balanced,0.17484800020853677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,8,power_law_1.01,0.17312639951705933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,8,power_law_1.01,0.1740991950035095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,8,power_law_1.2,0.16826879978179932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,1,8,power_law_1.2,0.16834559440612792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,2,1,balanced,0.24879467487335205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,2,1,balanced,0.2515466610590617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,2,1,power_law_1.01,0.27275519371032714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,2,1,power_law_1.01,0.27370879650115965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,2,1,power_law_1.2,0.2764863967895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,2,1,power_law_1.2,0.28041601181030273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,4,1,balanced,0.16768532991409302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,4,1,balanced,0.1694613297780355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,4,1,power_law_1.01,0.19456000328063966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,4,1,power_law_1.01,0.19512959718704223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,4,1,power_law_1.2,0.19729280471801758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,1536,8,128,4,1,power_law_1.2,0.19953919649124147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,1,balanced,4.511301358540853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,1,balanced,4.515647888183594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,1,power_law_1.01,4.053593444824219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,1,power_law_1.01,4.095750427246093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,1,power_law_1.2,4.198598480224609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,1,power_law_1.2,4.204121780395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,128,balanced,0.33406933148701984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,128,balanced,0.3344053427378337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,128,power_law_1.01,0.3321471929550171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,128,power_law_1.01,0.33242239952087405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,128,power_law_1.2,0.3292288064956665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,128,power_law_1.2,0.33267199993133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,16,balanced,0.580618659655253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,16,balanced,0.5817013184229533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,16,power_law_1.01,0.5562687873840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,16,power_law_1.01,0.5678400039672852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,16,power_law_1.2,0.5649856090545654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,16,power_law_1.2,0.5704256057739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,2,balanced,2.4243253072102866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,2,balanced,2.4260640144348145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,2,power_law_1.01,2.191769599914551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,2,power_law_1.01,2.253440093994141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,2,power_law_1.2,2.2444671630859374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,2,power_law_1.2,2.257094383239746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,256,balanced,0.3161546587944031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,256,balanced,0.31758934259414673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,256,power_law_1.01,0.31372799873352053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,256,power_law_1.01,0.3150784015655518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,256,power_law_1.2,0.315449595451355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,256,power_law_1.2,0.3155776023864746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,32,balanced,0.44310931364695233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,32,balanced,0.4455946683883667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,32,power_law_1.01,0.4279488086700439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,32,power_law_1.01,0.4421567916870117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,32,power_law_1.2,0.4360832214355469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,32,power_law_1.2,0.43865599632263186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,4,balanced,1.3752800623575847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,4,balanced,1.3781013488769531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,4,power_law_1.01,1.273094367980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,4,power_law_1.01,1.2748671531677247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,4,power_law_1.2,1.2766976356506348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,4,power_law_1.2,1.3029376029968263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,64,balanced,0.37544000148773193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,64,balanced,0.37577064832051593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,64,power_law_1.01,0.371558403968811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,64,power_law_1.01,0.3731328010559082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,64,power_law_1.2,0.36636159420013426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,64,power_law_1.2,0.37221760749816896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,8,balanced,0.8510719935099283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,8,balanced,0.8514026800791422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,8,power_law_1.01,0.7851903915405274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,8,power_law_1.01,0.7901055812835693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,8,power_law_1.2,0.8003840446472168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,4096,2688,22,512,1,8,power_law_1.2,0.8178367614746094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,1,balanced,0.7893119653066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,1,balanced,0.791045347849528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,1,power_law_1.01,0.924294376373291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,1,power_law_1.01,0.933465576171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,1,power_law_1.2,0.9058560371398926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,1,power_law_1.2,0.922976016998291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,2,balanced,0.4636586507161458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,2,balanced,0.46384533246358234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,2,power_law_1.01,0.5929535865783692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,2,power_law_1.01,0.6967103958129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,2,power_law_1.2,0.6062592029571533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,2,power_law_1.2,0.629260778427124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,4,balanced,0.3445546627044678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,4,balanced,0.34707732995351154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,4,power_law_1.01,0.4286335945129395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,4,power_law_1.01,0.44815359115600584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,4,power_law_1.2,0.43025918006896974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,4,power_law_1.2,0.4403007984161377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,8,balanced,0.29442665974299115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,8,balanced,0.2967573404312134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,8,power_law_1.01,0.36963839530944825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,8,power_law_1.01,0.37158401012420655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,8,power_law_1.2,0.368889594078064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,1,8,power_law_1.2,0.3785919904708862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,16,1,balanced,0.11584533254305522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,16,1,balanced,0.11692800124486287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,16,1,power_law_1.01,0.11530879735946656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,16,1,power_law_1.01,0.11552000045776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,16,1,power_law_1.2,0.11552000045776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,16,1,power_law_1.2,0.11608959436416626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,2,1,balanced,0.43873600165049237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,2,1,balanced,0.4395893414815267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,2,1,power_law_1.01,0.48215041160583494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,2,1,power_law_1.01,0.4885119915008545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,2,1,power_law_1.2,0.5001920223236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,2,1,power_law_1.2,0.5159488201141358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,32,1,balanced,0.09636267026265462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,32,1,balanced,0.09794132908185323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,32,1,power_law_1.01,0.09658240079879761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,32,1,power_law_1.01,0.09788159728050232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,32,1,power_law_1.2,0.0964735984802246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,32,1,power_law_1.2,0.09709439873695373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,4,1,balanced,0.2385759949684143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,4,1,balanced,0.24597332874933878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,4,1,power_law_1.01,0.28408958911895754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,4,1,power_law_1.01,0.28448638916015623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,4,1,power_law_1.2,0.283788800239563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,4,1,power_law_1.2,0.2845312118530273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,8,1,balanced,0.14070399602254233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,8,1,balanced,0.14078933000564575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,8,1,power_law_1.01,0.17764480113983155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,8,1,power_law_1.01,0.1863168001174927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,8,1,power_law_1.2,0.18625919818878173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,16384,2,8,8,1,power_law_1.2,0.1864127993583679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,1,balanced,2.568474610646566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,1,balanced,2.5690773328145347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,1,power_law_1.01,2.1642112731933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,1,power_law_1.01,2.181043243408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,1,power_law_1.2,2.1796991348266603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,1,power_law_1.2,2.200032043457031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,128,balanced,0.17883733908335367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,128,balanced,0.18033599853515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,128,power_law_1.01,0.17763839960098265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,128,power_law_1.01,0.17772799730300903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,128,power_law_1.2,0.17786879539489747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,128,power_law_1.2,0.1779647946357727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,16,balanced,0.30957333246866864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,16,balanced,0.31033066908518475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,16,power_law_1.01,0.276857590675354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,16,power_law_1.01,0.2993216037750244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,16,power_law_1.2,0.28412160873413084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,16,power_law_1.2,0.28679039478302004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,2,balanced,1.3632853825887044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,2,balanced,1.3637173970540364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,2,power_law_1.01,1.1969728469848633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,2,power_law_1.01,1.2221759796142577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,2,power_law_1.2,1.1813823699951171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,2,power_law_1.2,1.2042176246643066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,256,balanced,0.17245332400004068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,256,balanced,0.1753066579500834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,256,power_law_1.01,0.17111040353775026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,256,power_law_1.01,0.1725119948387146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,256,power_law_1.2,0.17111040353775026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,256,power_law_1.2,0.17136000394821166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,32,balanced,0.23415466149648032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,32,balanced,0.23464532693227133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,32,power_law_1.01,0.2265536069869995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,32,power_law_1.01,0.23071999549865724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,32,power_law_1.2,0.2246272087097168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,32,power_law_1.2,0.23096959590911864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,4,balanced,0.7664586702982584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,4,balanced,0.7687040170033773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,4,power_law_1.01,0.6771071910858154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,4,power_law_1.01,0.6797311782836915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,4,power_law_1.2,0.6645567893981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,4,power_law_1.2,0.6967167854309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,64,balanced,0.19356266657511392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,64,balanced,0.19500799973805746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,64,power_law_1.01,0.1900928020477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,64,power_law_1.01,0.19253120422363282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,64,power_law_1.2,0.1883263945579529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,64,power_law_1.2,0.18978559970855713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,8,balanced,0.45706133047739667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,8,balanced,0.45739734172821045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,8,power_law_1.01,0.43343358039855956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,8,power_law_1.01,0.43569278717041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,8,power_law_1.2,0.42471680641174314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,1,8,power_law_1.2,0.4268223762512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,16,1,balanced,0.3492586612701416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,16,1,balanced,0.35077865918477374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,16,1,power_law_1.01,0.3233599901199341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,16,1,power_law_1.01,0.3247744083404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,16,1,power_law_1.2,0.32385280132293703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,16,1,power_law_1.2,0.3261375904083252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,2,1,balanced,1.3682559331258137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,2,1,balanced,1.3685493469238281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,2,1,power_law_1.01,1.1790592193603515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,2,1,power_law_1.01,1.1807871818542481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,2,1,power_law_1.2,1.1957440376281738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,2,1,power_law_1.2,1.1995200157165526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,4,1,balanced,0.46929601828257245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,4,1,balanced,0.4719039996465047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,4,1,power_law_1.01,0.4278848171234131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,4,1,power_law_1.01,0.428985595703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,4,1,power_law_1.2,0.4322624206542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,4,1,power_law_1.2,0.4377151966094971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,8,1,balanced,0.2967413266499837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,8,1,balanced,0.29739199082056683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,8,1,power_law_1.01,0.2728127956390381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,8,1,power_law_1.01,0.27575039863586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,8,1,power_law_1.2,0.2771327972412109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2048,8,256,8,1,power_law_1.2,0.2786815881729126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,1,balanced,2.0352746645609536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,1,balanced,2.035813331604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,1,power_law_1.01,1.8810752868652343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,1,power_law_1.01,1.9363519668579101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,1,power_law_1.2,1.9572799682617188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,1,power_law_1.2,1.994553565979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,16,balanced,0.25890666246414185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,16,balanced,0.25913067658742267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,16,power_law_1.01,0.25350399017333985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,16,power_law_1.01,0.25493760108947755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,16,power_law_1.2,0.2543488025665283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,16,power_law_1.2,0.25443201065063475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,2,balanced,1.0818400382995605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,2,balanced,1.0824373563130696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,2,power_law_1.01,1.0185088157653808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,2,power_law_1.01,1.0411135673522949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,2,power_law_1.2,1.0542911529541015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,2,power_law_1.2,1.0776127815246581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,32,balanced,0.1892426609992981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,32,balanced,0.19010132551193237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,32,power_law_1.01,0.18584320545196534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,32,power_law_1.01,0.1877120018005371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,32,power_law_1.2,0.18724479675292968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,32,power_law_1.2,0.1901568055152893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,4,balanced,0.43873600165049237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,4,balanced,0.43944533665974933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,4,power_law_1.01,0.4399424076080322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,4,power_law_1.01,0.45336318016052246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,4,power_law_1.2,0.4407936096191406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,4,power_law_1.2,0.4607552051544189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,8,balanced,0.37164799372355145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,8,balanced,0.37279999256134033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,8,power_law_1.01,0.3637120008468628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,8,power_law_1.01,0.3650559902191162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,8,power_law_1.2,0.36506240367889403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,1,8,power_law_1.2,0.3676032066345215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,2,1,balanced,1.0811413129170735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,2,1,balanced,1.082090695699056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,2,1,power_law_1.01,1.0073663711547851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,2,1,power_law_1.01,1.028876781463623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,2,1,power_law_1.2,1.0433088302612306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,2,1,power_law_1.2,1.0621184349060058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,4,1,balanced,0.3707360029220581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,4,1,balanced,0.37107733885447186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,4,1,power_law_1.01,0.3908544063568115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,4,1,power_law_1.01,0.39352319240570066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,4,1,power_law_1.2,0.40188798904418943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,6144,2560,8,160,4,1,power_law_1.2,0.40221438407897947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,1,balanced,2.992111841837565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,1,balanced,2.9943679173787436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,1,power_law_1.01,2.5783872604370117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,1,power_law_1.01,2.5823104858398436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,1,power_law_1.2,2.556096076965332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,1,power_law_1.2,2.6436607360839846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,128,balanced,0.20166399081548056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,128,balanced,0.20286399126052856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,128,power_law_1.01,0.20106239318847657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,128,power_law_1.01,0.2026815891265869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,128,power_law_1.2,0.20166399478912353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,128,power_law_1.2,0.20212481021881104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,16,balanced,0.35053332646687824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,16,balanced,0.350597341855367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,16,power_law_1.01,0.3305599927902222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,16,power_law_1.01,0.33454079627990724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,16,power_law_1.2,0.3230783939361572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,16,power_law_1.2,0.3300928115844727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,2,balanced,1.5802987416585286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,2,balanced,1.5807199478149414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,2,power_law_1.01,1.3674495697021485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,2,power_law_1.01,1.4351743698120116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,2,power_law_1.2,1.3694720268249512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,2,power_law_1.2,1.4125375747680664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,256,balanced,0.19534399112065634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,256,balanced,0.19742933909098306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,256,power_law_1.01,0.194758403301239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,256,power_law_1.01,0.19530880451202393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,256,power_law_1.2,0.19448319673538209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,256,power_law_1.2,0.1947711944580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,32,balanced,0.26090667645136517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,32,balanced,0.2614293297131856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,32,power_law_1.01,0.25201280117034913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,32,power_law_1.01,0.25484800338745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,32,power_law_1.2,0.24211199283599855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,32,power_law_1.2,0.2570751905441284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,4,balanced,0.8832159837086996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,4,balanced,0.8838933308919271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,4,power_law_1.01,0.7986752033233643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,4,power_law_1.01,0.8109439849853516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,4,power_law_1.2,0.779744005203247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,4,power_law_1.2,0.7882880210876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,64,balanced,0.21410133441289267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,64,balanced,0.21522132555643717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,64,power_law_1.01,0.2137216091156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,64,power_law_1.01,0.21415040493011475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,64,power_law_1.2,0.21175038814544678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,64,power_law_1.2,0.2136768102645874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,8,balanced,0.5255733331044515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,8,balanced,0.5256533225377401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,8,power_law_1.01,0.483571195602417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,8,power_law_1.01,0.4967616081237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,8,power_law_1.2,0.4769472122192383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,1,8,power_law_1.2,0.48757758140563967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,16,1,balanced,0.4043840169906616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,16,1,balanced,0.4044373432795207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,16,1,power_law_1.01,0.3738624095916748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,16,1,power_law_1.01,0.38039679527282716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,16,1,power_law_1.2,0.37625598907470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,16,1,power_law_1.2,0.37731199264526366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,2,1,balanced,1.5942400296529133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,2,1,balanced,1.5943573315938313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,2,1,power_law_1.01,1.3607232093811035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,2,1,power_law_1.01,1.3690367698669434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,2,1,power_law_1.2,1.3948800086975097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,2,1,power_law_1.2,1.4005696296691894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,4,1,balanced,0.5523039897282919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,4,1,balanced,0.5540693203608195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,4,1,power_law_1.01,0.49475841522216796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,4,1,power_law_1.01,0.505299186706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,4,1,power_law_1.2,0.5001023769378662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,4,1,power_law_1.2,0.500819206237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,8,1,balanced,0.3413013219833374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,8,1,balanced,0.34379732608795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,8,1,power_law_1.01,0.3060415983200073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,8,1,power_law_1.01,0.30971519947052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,8,1,power_law_1.2,0.320415997505188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,256,8,1,power_law_1.2,0.32044799327850343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,1,balanced,4.423930803934733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,1,balanced,4.424661318461101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,1,power_law_1.01,3.4623294830322267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,1,power_law_1.01,3.4849857330322265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,1,power_law_1.2,3.4652481079101562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,1,power_law_1.2,3.480486297607422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,128,balanced,0.2564586599667867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,128,balanced,0.25728533665339154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,128,power_law_1.01,0.25471999645233157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,128,power_law_1.01,0.2548799991607666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,128,power_law_1.2,0.25109119415283204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,128,power_law_1.2,0.2550976037979126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,16,balanced,0.49113066991170246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,16,balanced,0.4919039805730184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,16,power_law_1.01,0.4372608184814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,16,power_law_1.01,0.43888001441955565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,16,power_law_1.2,0.4624320030212402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,16,power_law_1.2,0.4693183898925781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,2,balanced,2.3205493291219077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,2,balanced,2.321002642313639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,2,power_law_1.01,1.7948671340942384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,2,power_law_1.01,1.9165376663208007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,2,power_law_1.2,1.8107519149780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,2,power_law_1.2,1.9169536590576173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,32,balanced,0.3608320156733195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,32,balanced,0.3615093231201172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,32,power_law_1.01,0.3383615970611572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,32,power_law_1.01,0.3404608011245728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,32,power_law_1.2,0.3299839973449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,32,power_law_1.2,0.34447360038757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,4,balanced,1.2796533107757568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,4,balanced,1.2833173274993896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,4,power_law_1.01,1.0467647552490233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,4,power_law_1.01,1.0964608192443848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,4,power_law_1.2,1.0737792015075684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,4,power_law_1.2,1.0779007911682128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,64,balanced,0.2894773284594218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,64,balanced,0.28995199998219806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,64,power_law_1.01,0.2835263967514038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,64,power_law_1.01,0.2896960020065308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,64,power_law_1.2,0.27932798862457275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,64,power_law_1.2,0.28716158866882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,8,balanced,0.7583839893341064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,8,balanced,0.7593706448872884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,8,power_law_1.01,0.6368000030517578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,8,power_law_1.01,0.6383168220520019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,8,power_law_1.2,0.6512191772460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,1,8,power_law_1.2,0.6876863956451416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,16,1,balanced,0.3280319968859355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,16,1,balanced,0.3282986680666606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,16,1,power_law_1.01,0.2817728042602539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,16,1,power_law_1.01,0.28519039154052733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,16,1,power_law_1.2,0.28562560081481936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,16,1,power_law_1.2,0.2863039970397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,2,1,balanced,2.340106646219889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,2,1,balanced,2.3430933952331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,2,1,power_law_1.01,1.8484031677246093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,2,1,power_law_1.01,1.8913152694702149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,2,1,power_law_1.2,1.8753984451293946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,2,1,power_law_1.2,1.8823808670043944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,4,1,balanced,1.3297173182169597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,4,1,balanced,1.3328853448232014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,4,1,power_law_1.01,1.090067195892334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,4,1,power_law_1.01,1.0904576301574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,4,1,power_law_1.2,1.0312000274658204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,4,1,power_law_1.2,1.0503487586975098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,8,1,balanced,0.4740533431371053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,8,1,balanced,0.4746239980061849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,8,1,power_law_1.01,0.40208001136779786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,8,1,power_law_1.01,0.40307841300964353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,8,1,power_law_1.2,0.39439361095428466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,192,7168,2048,8,384,8,1,power_law_1.2,0.4060031890869141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,1,balanced,0.037605332831541695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,1,balanced,0.04043733328580856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,1,power_law_1.01,0.039878401160240176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,1,power_law_1.01,0.040249601006507874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,1,power_law_1.2,0.040608000755310056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,1,power_law_1.2,0.040940800309181215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,128,balanced,0.037077332536379494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,128,balanced,0.037434667348861694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,128,power_law_1.01,0.03461120128631592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,128,power_law_1.01,0.03597440123558045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,128,power_law_1.2,0.035231998562812804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,128,power_law_1.2,0.035334399342536925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,16,balanced,0.03534399966398875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,16,balanced,0.037418665985266365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,16,power_law_1.01,0.03521920144557953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,16,power_law_1.01,0.035776001214981076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,16,power_law_1.2,0.035667198896408084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,16,power_law_1.2,0.035846400260925296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,2,balanced,0.03748800108830134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,2,balanced,0.03905066599448522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,2,power_law_1.01,0.04362240135669708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,2,power_law_1.01,0.04438399970531463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,2,power_law_1.2,0.042335999011993405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,2,power_law_1.2,0.0423552006483078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,32,balanced,0.03454400102297465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,32,balanced,0.03563733398914337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,32,power_law_1.01,0.035699200630187986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,32,power_law_1.01,0.03573119938373566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,32,power_law_1.2,0.03511039912700653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,32,power_law_1.2,0.03729279935359955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,4,balanced,0.037621334195137024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,4,balanced,0.043525333205858864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,4,power_law_1.01,0.042156800627708435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,4,power_law_1.01,0.04217599928379059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,4,power_law_1.2,0.04044800102710724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,4,power_law_1.2,0.043558400869369504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,64,balanced,0.03740799923737844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,64,balanced,0.03769599894682566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,64,power_law_1.01,0.03430399894714355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,64,power_law_1.01,0.03527039885520935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,64,power_law_1.2,0.03521279990673065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,64,power_law_1.2,0.03603839874267578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,8,balanced,0.03559466699759165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,8,balanced,0.03774933268626531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,8,power_law_1.01,0.03770880103111267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,8,power_law_1.01,0.04014720022678375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,8,power_law_1.2,0.036083200573921205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,1,8,power_law_1.2,0.03809280097484589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,2,1,balanced,0.03136000037193298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,2,1,balanced,0.03152533372243246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,2,1,power_law_1.01,0.03219200074672699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,2,1,power_law_1.01,0.03221119940280914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,2,1,power_law_1.2,0.032313600182533264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,2048,768,8,128,2,1,power_law_1.2,0.032569599151611325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,1,balanced,0.0680320014556249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,1,balanced,0.06841599941253662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,1,power_law_1.01,0.06599040031433105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,1,power_law_1.01,0.06631039977073669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,1,power_law_1.2,0.06600319743156433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,1,power_law_1.2,0.06666880249977111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,128,balanced,0.043621331453323364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,128,balanced,0.04366933306058248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,128,power_law_1.01,0.04200960099697113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,128,power_law_1.01,0.04215039908885956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,128,power_law_1.2,0.04142720103263855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,128,power_law_1.2,0.04213759899139404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,16,balanced,0.04186133543650309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,16,balanced,0.043663998444875084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,16,power_law_1.01,0.07185919880867005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,16,power_law_1.01,0.0725055992603302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,16,power_law_1.2,0.06993280053138733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,16,power_law_1.2,0.07082239985466003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,2,balanced,0.060133333007494606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,2,balanced,0.06102933486302694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,2,power_law_1.01,0.07153919935226441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,2,power_law_1.01,0.07195519804954528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,2,power_law_1.2,0.07178239822387696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,2,power_law_1.2,0.07208960056304932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,256,balanced,0.0436106671889623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,256,balanced,0.04363200068473816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,256,power_law_1.01,0.04184960126876831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,256,power_law_1.01,0.04221439957618713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,256,power_law_1.2,0.04216319918632507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,256,power_law_1.2,0.042438399791717527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,32,balanced,0.04160533348719279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,32,balanced,0.043653334180514015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,32,power_law_1.01,0.05863040089607239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,32,power_law_1.01,0.05909759998321533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,32,power_law_1.2,0.05811840295791626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,32,power_law_1.2,0.0603007972240448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,4,balanced,0.04781866570313772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,4,balanced,0.050069332122802734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,4,power_law_1.01,0.07203199863433837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,4,power_law_1.01,0.07233920097351074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,4,power_law_1.2,0.07133439779281617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,4,power_law_1.2,0.07195519804954528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,64,balanced,0.042037333051363625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,64,balanced,0.04206933577855428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,64,power_law_1.01,0.0430400013923645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,64,power_law_1.01,0.04508160054683685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,64,power_law_1.2,0.043372800946235655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,64,power_law_1.2,0.0440064013004303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,8,balanced,0.043840001026789345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,8,balanced,0.04586666822433472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,8,power_law_1.01,0.07176960110664368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,8,power_law_1.01,0.0720255970954895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,8,power_law_1.2,0.07153279781341552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,1,8,power_law_1.2,0.07206400036811829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,2,1,balanced,0.05020800232887268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,2,1,balanced,0.052943999568621315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,2,1,power_law_1.01,0.05071359872817993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,2,1,power_law_1.01,0.05144320130348205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,2,1,power_law_1.2,0.05003520250320435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,2,1,power_law_1.2,0.05017600059509277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,4,1,balanced,0.039690665900707245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,4,1,balanced,0.0397119993964831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,4,1,power_law_1.01,0.03439359962940216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,4,1,power_law_1.01,0.034944000840187076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,4,1,power_law_1.2,0.036473599076271054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,3072,1536,8,256,4,1,power_law_1.2,0.03689599931240082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,1,balanced,0.18646933635075888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,1,balanced,0.18686399857203165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,1,power_law_1.01,0.17231359481811523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,1,power_law_1.01,0.1738816022872925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,1,power_law_1.2,0.16305919885635375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,1,power_law_1.2,0.17052799463272095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,2,balanced,0.15101333459218344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,2,balanced,0.15217600266138712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,2,power_law_1.01,0.1444991946220398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,2,power_law_1.01,0.15559680461883546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,2,power_law_1.2,0.14365439414978026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,2,power_law_1.2,0.1571776032447815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,4,balanced,0.1276479959487915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,4,balanced,0.1305333375930786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,4,power_law_1.01,0.12961280345916748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,4,power_law_1.01,0.13273600339889527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,4,power_law_1.2,0.1443071961402893
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,4,power_law_1.2,0.16493439674377441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,8,balanced,0.1265066663424174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,8,balanced,0.12777066230773926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,8,power_law_1.01,0.12611839771270753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,8,power_law_1.01,0.12636799812316896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,8,power_law_1.2,0.12654080390930175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,1,8,power_law_1.2,0.12698880434036255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,16,1,balanced,0.04049066702524821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,16,1,balanced,0.04161066561937332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,16,1,power_law_1.01,0.04524799883365631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,16,1,power_law_1.01,0.04639999866485596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,16,1,power_law_1.2,0.04469760060310364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,16,1,power_law_1.2,0.04948480129241943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,2,1,balanced,0.10689600308736165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,2,1,balanced,0.10751466949780782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,2,1,power_law_1.01,0.09380480051040649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,2,1,power_law_1.01,0.10401279926300049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,2,1,power_law_1.2,0.09560319781303406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,2,1,power_law_1.2,0.10319360494613647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,4,1,balanced,0.07311466832955678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,4,1,balanced,0.07701866825421651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,4,1,power_law_1.01,0.07214720249176025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,4,1,power_law_1.01,0.08012160062789916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,4,1,power_law_1.2,0.06825600266456604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,4,1,power_law_1.2,0.06902400255203248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,8,1,balanced,0.0539626677831014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,8,1,balanced,0.0558186670144399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,8,1,power_law_1.01,0.05296639800071716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,8,1,power_law_1.01,0.053523200750350955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,8,1,power_law_1.2,0.052051198482513425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,14336,2,8,8,1,power_law_1.2,0.05588480234146118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,1,balanced,0.07849066456158955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,1,balanced,0.08251733581225078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,1,power_law_1.01,0.07767680287361145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,1,power_law_1.01,0.07879679799079894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,1,power_law_1.2,0.07946879863739013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,1,power_law_1.2,0.07948160171508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,128,balanced,0.045824001232783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,128,balanced,0.046181331078211464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,128,power_law_1.01,0.045184001326560974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,128,power_law_1.01,0.04528000056743622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,128,power_law_1.2,0.044947201013565065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,128,power_law_1.2,0.04527359902858734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,16,balanced,0.045909335215886436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,16,balanced,0.047914668917655945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,16,power_law_1.01,0.06625919938087463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,16,power_law_1.01,0.0679040014743805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,16,power_law_1.2,0.06510720252990723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,16,power_law_1.2,0.06665599942207337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,2,balanced,0.06835199892520905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,2,balanced,0.07019199927647908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,2,power_law_1.01,0.07319039702415467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,2,power_law_1.01,0.07567999958992004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,2,power_law_1.2,0.07496320009231568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,2,power_law_1.2,0.08017920255661011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,32,balanced,0.04574400186538696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,32,balanced,0.04605866471926371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,32,power_law_1.01,0.049516800045967105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,32,power_law_1.01,0.05607039928436279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,32,power_law_1.2,0.05056639909744263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,32,power_law_1.2,0.05570560097694397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,4,balanced,0.05573866764704386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,4,balanced,0.056048000852266945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,4,power_law_1.01,0.07122560143470764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,4,power_law_1.01,0.07322239875793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,4,power_law_1.2,0.06887680292129517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,4,power_law_1.2,0.06936320066452026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,64,balanced,0.04571733375390371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,64,balanced,0.045909335215886436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,64,power_law_1.01,0.04519039988517761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,64,power_law_1.01,0.04538240134716034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,64,power_law_1.2,0.04508799910545349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,64,power_law_1.2,0.04539520144462585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,8,balanced,0.045882667104403176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,8,balanced,0.045941332976023354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,8,power_law_1.01,0.06901760101318359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,8,power_law_1.01,0.0699072003364563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,8,power_law_1.2,0.0655680000782013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,1,8,power_law_1.2,0.06832640171051026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,2,1,balanced,0.0581226646900177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,2,1,balanced,0.059765333930651345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,2,1,power_law_1.01,0.056652802228927615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,2,1,power_law_1.01,0.05674880146980286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,2,1,power_law_1.2,0.05726079940795899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,2,1,power_law_1.2,0.05861759781837463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,4,1,balanced,0.04387199878692627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,4,1,balanced,0.04560000201066335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,4,1,power_law_1.01,0.04442879855632782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,4,1,power_law_1.01,0.04497919976711273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,4,1,power_law_1.2,0.044819200038909913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,1536,8,128,4,1,power_law_1.2,0.04537599980831146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,1,balanced,0.2793440024058024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,1,balanced,0.28334399064381915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,1,power_law_1.01,0.2783679962158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,1,power_law_1.01,0.28037118911743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,1,power_law_1.2,0.27800960540771485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,1,power_law_1.2,0.2788288116455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,128,balanced,0.05209066470464071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,128,balanced,0.05366399884223938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,128,power_law_1.01,0.07209600210189819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,128,power_law_1.01,0.07223680019378662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,128,power_law_1.2,0.07189120054244995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,128,power_law_1.2,0.07306240200996399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,16,balanced,0.07252799967924754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,16,balanced,0.07419733206431071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,16,power_law_1.01,0.22313599586486815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,16,power_law_1.01,0.2238464117050171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,16,power_law_1.2,0.2037503957748413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,16,power_law_1.2,0.20880000591278075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,2,balanced,0.1742239991823832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,2,balanced,0.17492266496022543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,2,power_law_1.01,0.2825279951095581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,2,power_law_1.01,0.2866751909255981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,2,power_law_1.2,0.2383552074432373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,2,power_law_1.2,0.24275200366973876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,256,balanced,0.05216533442338308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,256,balanced,0.05386666456858317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,256,power_law_1.01,0.054636800289154054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,256,power_law_1.01,0.0559935986995697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,256,power_law_1.2,0.05682560205459595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,256,power_law_1.2,0.0587007999420166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,32,balanced,0.06862399975458781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,32,balanced,0.07022400200366974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,32,power_law_1.01,0.13791359663009645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,32,power_law_1.01,0.1385856032371521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,32,power_law_1.2,0.1376960039138794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,32,power_law_1.2,0.13814400434494017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,4,balanced,0.1076586643854777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,4,balanced,0.10806933045387268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,4,power_law_1.01,0.2827264070510864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,4,power_law_1.01,0.2848959922790527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,4,power_law_1.2,0.21756160259246826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,4,power_law_1.2,0.23019518852233886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,64,balanced,0.058304001887639366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,64,balanced,0.060533334811528526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,64,power_law_1.01,0.08543999791145325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,64,power_law_1.01,0.08776959776878357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,64,power_law_1.2,0.08552320003509521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,64,power_law_1.2,0.0871936023235321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,8,balanced,0.08463999629020691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,8,balanced,0.08538132905960083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,8,power_law_1.01,0.28545279502868653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,8,power_law_1.01,0.2868160009384155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,8,power_law_1.2,0.19519360065460206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,4096,2688,22,512,1,8,power_law_1.2,0.19872000217437744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,1,balanced,0.26500266790390015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,1,balanced,0.2672533392906189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,1,power_law_1.01,0.24900479316711427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,1,power_law_1.01,0.2510591983795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,1,power_law_1.2,0.2401279926300049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,1,power_law_1.2,0.24450559616088868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,2,balanced,0.2057653268178304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,2,balanced,0.21061333020528158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,2,power_law_1.01,0.21972479820251464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,2,power_law_1.01,0.23756799697875977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,2,power_law_1.2,0.18880640268325805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,2,power_law_1.2,0.1900928020477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,4,balanced,0.1613599956035614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,4,balanced,0.16164799531300864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,4,power_law_1.01,0.16346880197525024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,4,power_law_1.01,0.1662783980369568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,4,power_law_1.2,0.16295679807662963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,4,power_law_1.2,0.17950719594955444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,8,balanced,0.1586240033308665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,8,balanced,0.1588106652100881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,8,power_law_1.01,0.15630719661712647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,8,power_law_1.01,0.15644160509109498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,8,power_law_1.2,0.1565567970275879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,1,8,power_law_1.2,0.17843199968338014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,16,1,balanced,0.058090666929880776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,16,1,balanced,0.06011199951171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,16,1,power_law_1.01,0.05839359760284424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,16,1,power_law_1.01,0.05882880091667175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,16,1,power_law_1.2,0.05845119953155518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,16,1,power_law_1.2,0.05886080265045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,2,1,balanced,0.1476746698220571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,2,1,balanced,0.14841066797574362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,2,1,power_law_1.01,0.13461120128631593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,2,1,power_law_1.01,0.145798397064209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,2,1,power_law_1.2,0.13152639865875243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,2,1,power_law_1.2,0.13706239461898803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,32,1,balanced,0.04646400113900503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,32,1,balanced,0.04781333108743032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,32,1,power_law_1.01,0.0506879985332489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,32,1,power_law_1.01,0.05307520031929016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,32,1,power_law_1.2,0.04726400077342987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,32,1,power_law_1.2,0.05082240104675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,4,1,balanced,0.09701333443323772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,4,1,balanced,0.11195199688275655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,4,1,power_law_1.01,0.08423680067062378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,4,1,power_law_1.01,0.08762239813804626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,4,1,power_law_1.2,0.08559359908103943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,4,1,power_law_1.2,0.09397119879722596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,8,1,balanced,0.07111999889214833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,8,1,balanced,0.07147733370463054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,8,1,power_law_1.01,0.06963199973106385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,8,1,power_law_1.01,0.07288320064544677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,8,1,power_law_1.2,0.06504319906234741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,16384,2,8,8,1,power_law_1.2,0.06759679913520814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,1,balanced,0.13397333025932312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,1,balanced,0.1365386644999186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,1,power_law_1.01,0.13404799699783326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,1,power_law_1.01,0.13537280559539794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,1,power_law_1.2,0.13571200370788575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,1,power_law_1.2,0.13579519987106323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,128,balanced,0.055999999245007835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,128,balanced,0.05602666735649109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,128,power_law_1.01,0.05984640121459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,128,power_law_1.01,0.06651520133018493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,128,power_law_1.2,0.05818880200386047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,128,power_law_1.2,0.06220160126686096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,16,balanced,0.05611200133959452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,16,balanced,0.05614933371543884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,16,power_law_1.01,0.13965439796447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,16,power_law_1.01,0.14088319540023803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,16,power_law_1.2,0.1364416003227234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,16,power_law_1.2,0.13997440338134765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,2,balanced,0.09678933024406433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,2,balanced,0.0977280040582021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,2,power_law_1.01,0.14110080003738404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,2,power_law_1.01,0.14383360147476196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,2,power_law_1.2,0.1388864040374756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,2,power_law_1.2,0.14024959802627562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,256,balanced,0.055173332492510475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,256,balanced,0.05597866574923197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,256,power_law_1.01,0.05432320237159729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,256,power_law_1.01,0.05441280007362366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,256,power_law_1.2,0.05418239831924439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,256,power_law_1.2,0.05544319748878479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,32,balanced,0.054154664278030396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,32,balanced,0.056186666091283165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,32,power_law_1.01,0.09492480158805847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,32,power_law_1.01,0.09514880180358887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,32,power_law_1.2,0.09390720129013061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,32,power_law_1.2,0.0958079993724823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,4,balanced,0.08031466603279114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,4,balanced,0.08075200021266937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,4,power_law_1.01,0.14061440229415895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,4,power_law_1.01,0.1425984025001526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,4,power_law_1.2,0.13616640567779542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,4,power_law_1.2,0.13827840089797974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,64,balanced,0.054058666030565895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,64,balanced,0.05598933498064677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,64,power_law_1.01,0.07643520236015319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,64,power_law_1.01,0.07745919823646545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,64,power_law_1.2,0.07807999849319458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,64,power_law_1.2,0.07861760258674622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,8,balanced,0.058602665861447654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,8,balanced,0.05978666742642721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,8,power_law_1.01,0.14413440227508545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,8,power_law_1.01,0.14543360471725464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,8,power_law_1.2,0.13680000305175782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,1,8,power_law_1.2,0.13982080221176146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,16,1,balanced,0.04789866507053375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,16,1,balanced,0.052005335688591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,16,1,power_law_1.01,0.045977601408958436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,16,1,power_law_1.01,0.046137601137161255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,16,1,power_law_1.2,0.045721599459648134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,16,1,power_law_1.2,0.047065600752830505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,2,1,balanced,0.08823466300964355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,2,1,balanced,0.0888426701227824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,2,1,power_law_1.01,0.08629119992256165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,2,1,power_law_1.01,0.08680319786071777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,2,1,power_law_1.2,0.08661119937896729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,2,1,power_law_1.2,0.08695679903030396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,4,1,balanced,0.06834133466084798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,4,1,balanced,0.06894400219122569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,4,1,power_law_1.01,0.06675840020179749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,4,1,power_law_1.01,0.06767359972000123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,4,1,power_law_1.2,0.06750079989433289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,4,1,power_law_1.2,0.06779519915580749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,8,1,balanced,0.05187733471393585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,8,1,balanced,0.051914667089780174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,8,1,power_law_1.01,0.051052802801132204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,8,1,power_law_1.2,0.050374400615692136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2048,8,256,8,1,power_law_1.2,0.05177599787712097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,1,balanced,0.18181333939234415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,1,balanced,0.18427199125289917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,1,power_law_1.01,0.18218239545822143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,1,power_law_1.01,0.18348159790039062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,1,power_law_1.2,0.17909120321273803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,1,power_law_1.2,0.1850111961364746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,16,balanced,0.05801066756248474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,16,balanced,0.05806399881839752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,16,power_law_1.01,0.11640959978103638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,16,power_law_1.01,0.1204800009727478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,16,power_law_1.2,0.1059648036956787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,16,power_law_1.2,0.11384320259094238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,2,balanced,0.10551466544469197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,2,balanced,0.10710933804512024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,2,power_law_1.01,0.17755520343780518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,2,power_law_1.01,0.18737280368804932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,2,power_law_1.2,0.13472000360488892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,2,power_law_1.2,0.14765440225601195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,32,balanced,0.057999998331069946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,32,balanced,0.05818133552869161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,32,power_law_1.01,0.08722559809684753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,32,power_law_1.01,0.08843520283699036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,32,power_law_1.2,0.08673279881477355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,32,power_law_1.2,0.08768640160560608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,4,balanced,0.09643200039863586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,4,balanced,0.10096533099810283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,4,power_law_1.01,0.16428799629211427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,4,power_law_1.01,0.17114239931106567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,4,power_law_1.2,0.12480000257492066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,4,power_law_1.2,0.12547199726104735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,8,balanced,0.07040533423423767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,8,balanced,0.07254933317502339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,8,power_law_1.01,0.14465919733047486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,8,power_law_1.01,0.17112319469451903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,8,power_law_1.2,0.11422079801559448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,1,8,power_law_1.2,0.11920000314712524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,2,1,balanced,0.10097066561381023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,2,1,balanced,0.10108266274134318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,2,1,power_law_1.01,0.0986240029335022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,2,1,power_law_1.01,0.09960319995880126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,2,1,power_law_1.2,0.09878399968147278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,2,1,power_law_1.2,0.09879040122032165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,4,1,balanced,0.07227733234564464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,4,1,balanced,0.07237333556016286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,4,1,power_law_1.01,0.07214080095291138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,4,1,power_law_1.01,0.07333760261535645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,4,1,power_law_1.2,0.07143679857254029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,6144,2560,8,160,4,1,power_law_1.2,0.0720192015171051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,1,balanced,0.14969066778818765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,1,balanced,0.15051199992497763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,1,power_law_1.01,0.1485759973526001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,1,power_law_1.01,0.15006719827651976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,1,power_law_1.2,0.14809600114822388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,1,power_law_1.2,0.1488767981529236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,128,balanced,0.06016000111897787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,128,balanced,0.060165335734685264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,128,power_law_1.01,0.0717311978340149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,128,power_law_1.01,0.07368320226669312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,128,power_law_1.2,0.07433599829673768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,128,power_law_1.2,0.0754047989845276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,16,balanced,0.05810666580994924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,16,balanced,0.0602400004863739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,16,power_law_1.01,0.15514880418777466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,16,power_law_1.01,0.15593600273132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,16,power_law_1.2,0.1514623999595642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,16,power_law_1.2,0.15640319585800172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,2,balanced,0.10710933804512024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,2,balanced,0.10753066341082256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,2,power_law_1.01,0.1547775983810425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,2,power_law_1.01,0.15526399612426758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,2,power_law_1.2,0.15171200037002563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,2,power_law_1.2,0.15344640016555786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,256,balanced,0.05986666679382324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,256,balanced,0.061610668897628784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,256,power_law_1.01,0.05839999914169312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,256,power_law_1.01,0.05885440111160278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,256,power_law_1.2,0.05812479853630066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,256,power_law_1.2,0.058412802219390866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,32,balanced,0.05852266649405161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,32,balanced,0.059978668888409935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,32,power_law_1.01,0.10376319885253907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,32,power_law_1.01,0.1044160008430481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,32,power_law_1.2,0.10427520275115967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,32,power_law_1.2,0.10432000160217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,4,balanced,0.08714133501052856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,4,balanced,0.08724799752235413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,4,power_law_1.01,0.15479040145874023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,4,power_law_1.01,0.1559231996536255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,4,power_law_1.2,0.15311360359191895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,4,power_law_1.2,0.15315840244293213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,64,balanced,0.060032000144322716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,64,balanced,0.06238933404286703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,64,power_law_1.01,0.08396160006523132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,64,power_law_1.01,0.08524799942970276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,64,power_law_1.2,0.08328319787979126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,64,power_law_1.2,0.08525440096855164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,8,balanced,0.06818666557470958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,8,balanced,0.0683786670366923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,8,power_law_1.01,0.15812480449676514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,8,power_law_1.01,0.1592319965362549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,8,power_law_1.2,0.15781760215759277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,1,8,power_law_1.2,0.15920640230178834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,16,1,balanced,0.05198400219281515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,16,1,balanced,0.054383998115857445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,16,1,power_law_1.01,0.049702399969100954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,16,1,power_law_1.01,0.05041279792785645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,16,1,power_law_1.2,0.05086719989776611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,16,1,power_law_1.2,0.054841601848602296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,2,1,balanced,0.09858666857083638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,2,1,balanced,0.09866133332252502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,2,1,power_law_1.01,0.09455999732017517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,2,1,power_law_1.01,0.09560319781303406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,2,1,power_law_1.2,0.0942911982536316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,2,1,power_law_1.2,0.09534080028533935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,4,1,balanced,0.07446933289368947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,4,1,balanced,0.0766293356815974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,4,1,power_law_1.01,0.073580801486969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,4,1,power_law_1.01,0.07374719977378845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,4,1,power_law_1.2,0.07396479845046997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,4,1,power_law_1.2,0.07483519911766053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,8,1,balanced,0.05786666770776113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,8,1,balanced,0.05969599882761637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,8,1,power_law_1.01,0.05808640122413635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,8,1,power_law_1.01,0.05896959900856018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,8,1,power_law_1.2,0.05816320180892944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,256,8,1,power_law_1.2,0.05829120278358459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,1,balanced,0.15178133050600687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,1,balanced,0.1520746648311615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,1,power_law_1.01,0.14948480129241942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,1,power_law_1.01,0.15018240213394166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,1,power_law_1.2,0.14947839975357055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,1,power_law_1.2,0.14952319860458374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,128,balanced,0.05989866455396017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,128,balanced,0.060266668597857155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,128,power_law_1.01,0.07864959836006165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,128,power_law_1.01,0.0791487991809845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,128,power_law_1.2,0.07865599989891052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,128,power_law_1.2,0.07946879863739013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,16,balanced,0.05820799867312113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,16,balanced,0.060218666990598045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,16,power_law_1.01,0.15605759620666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,16,power_law_1.01,0.15656960010528564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,16,power_law_1.2,0.15569920539855958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,16,power_law_1.2,0.15618560314178467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,2,balanced,0.10638399918874104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,2,balanced,0.10805333654085796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,2,power_law_1.01,0.15400320291519165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,2,power_law_1.01,0.15507199764251708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,2,power_law_1.2,0.15429120063781737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,2,power_law_1.2,0.15492479801177977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,32,balanced,0.0599839985370636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,32,balanced,0.06327466666698456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,32,power_law_1.01,0.13133440017700196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,32,power_law_1.01,0.13230719566345214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,32,power_law_1.2,0.13105920553207398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,32,power_law_1.2,0.13187839984893798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,4,balanced,0.08683199683825175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,4,balanced,0.08705600102742513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,4,power_law_1.01,0.15471999645233153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,4,power_law_1.01,0.1549888014793396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,4,power_law_1.2,0.15407999753952026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,4,power_law_1.2,0.15518720149993898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,64,balanced,0.0591786652803421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,64,balanced,0.06423466900984447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,64,power_law_1.01,0.09170560240745544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,64,power_law_1.01,0.09292160272598267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,64,power_law_1.2,0.09140480160713196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,64,power_law_1.2,0.09265919923782348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,8,balanced,0.07042666773001353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,8,balanced,0.07450133562088013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,8,power_law_1.01,0.15389440059661866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,8,power_law_1.01,0.1564288020133972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,8,power_law_1.2,0.15507199764251708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,1,8,power_law_1.2,0.1563199996948242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,16,1,balanced,0.05383466680844625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,16,1,balanced,0.05402133365472158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,16,1,power_law_1.01,0.0500544011592865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,16,1,power_law_1.01,0.05053439736366272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,16,1,power_law_1.2,0.05013759732246399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,16,1,power_law_1.2,0.05028480291366577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,2,1,balanced,0.09732266267140706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,2,1,balanced,0.09909333785374959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,2,1,power_law_1.01,0.09455360174179077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,2,1,power_law_1.01,0.09525759816169739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,2,1,power_law_1.2,0.09481599926948547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,2,1,power_law_1.2,0.09492480158805847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,4,1,balanced,0.07607466479142506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,4,1,balanced,0.07686399916807811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,4,1,power_law_1.01,0.07360000014305115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,4,1,power_law_1.01,0.07375360131263733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,4,1,power_law_1.2,0.07374079823493958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,4,1,power_law_1.2,0.07416319847106934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,8,1,balanced,0.059215997656186424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,8,1,balanced,0.05959466596444448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,8,1,power_law_1.01,0.057894402742385866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,8,1,power_law_1.01,0.05847679972648621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,8,1,power_law_1.2,0.058310401439666745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2,7168,2048,8,384,8,1,power_law_1.2,0.05851519703865051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,1,balanced,0.4846133391062419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,1,balanced,0.48626665274302167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,1,power_law_1.01,0.5635839939117432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,1,power_law_1.01,0.56528639793396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,1,power_law_1.2,0.562336015701294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,1,power_law_1.2,0.5660799980163574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,128,balanced,0.1850879987080892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,128,balanced,0.18635199467341104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,128,power_law_1.01,0.19736319780349731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,128,power_law_1.01,0.19786239862442018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,128,power_law_1.2,0.21306240558624268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,128,power_law_1.2,0.2140415906906128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,16,balanced,0.20556267102559408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,16,balanced,0.20562666654586792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,16,power_law_1.01,0.2314176082611084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,16,power_law_1.01,0.2327104091644287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,16,power_law_1.2,0.24019200801849366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,16,power_law_1.2,0.2442176103591919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,2,balanced,0.3536800146102905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,2,balanced,0.3539573351542155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,2,power_law_1.01,0.4073535919189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,2,power_law_1.01,0.4120192050933838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,2,power_law_1.2,0.42615041732788084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,2,power_law_1.2,0.4302847862243652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,32,balanced,0.1928266684214274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,32,balanced,0.19529066483179727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,32,power_law_1.01,0.21659519672393798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,32,power_law_1.01,0.22191359996795654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,32,power_law_1.2,0.22198400497436524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,32,power_law_1.2,0.22366719245910643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,4,balanced,0.2707253297170003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,4,balanced,0.27115732431411743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,4,power_law_1.01,0.31554560661315917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,4,power_law_1.01,0.32318720817565916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,4,power_law_1.2,0.3221951961517334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,4,power_law_1.2,0.3312319993972778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,64,balanced,0.18752533197402954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,64,balanced,0.18810667594273886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,64,power_law_1.01,0.204915189743042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,64,power_law_1.01,0.20899839401245118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,64,power_law_1.2,0.2178112030029297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,64,power_law_1.2,0.22415359020233155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,8,balanced,0.22869867086410522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,8,balanced,0.22913066546122232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,8,power_law_1.01,0.2543488025665283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,8,power_law_1.01,0.267577600479126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,8,power_law_1.2,0.26917119026184083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,1,8,power_law_1.2,0.278656005859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,2,1,balanced,0.30828267335891724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,2,1,balanced,0.3094613353411357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,2,1,power_law_1.01,0.34606080055236815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,2,1,power_law_1.01,0.3488384008407593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,2,1,power_law_1.2,0.34898560047149657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,2048,768,8,128,2,1,power_law_1.2,0.35474560260772703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,1,balanced,1.295418659845988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,1,balanced,1.2954506874084473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,1,power_law_1.01,1.7641792297363281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,1,power_law_1.01,1.7709375381469727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,1,power_law_1.2,1.8174720764160157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,1,power_law_1.2,1.8301055908203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,128,balanced,0.32850666840871173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,128,balanced,0.32892799377441406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,128,power_law_1.01,0.3535680055618286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,128,power_law_1.01,0.36008319854736326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,128,power_law_1.2,0.37309439182281495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,128,power_law_1.2,0.3791232109069824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,16,balanced,0.38437867164611816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,16,balanced,0.3860479990641276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,16,power_law_1.01,0.45379199981689455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,16,power_law_1.01,0.46131200790405275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,16,power_law_1.2,0.4682303905487061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,16,power_law_1.2,0.47543039321899416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,2,balanced,0.832090695699056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,2,balanced,0.8347520033518473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,2,power_law_1.01,1.0887743949890136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,2,power_law_1.01,1.1157183647155762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,2,power_law_1.2,1.1400768280029296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,2,power_law_1.2,1.1454079627990723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,256,balanced,0.3248053391774495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,256,balanced,0.326474666595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,256,power_law_1.01,0.343507194519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,256,power_law_1.01,0.3436608076095581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,256,power_law_1.2,0.36092801094055177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,256,power_law_1.2,0.3668031930923462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,32,balanced,0.3501226504643758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,32,balanced,0.350602666536967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,32,power_law_1.01,0.4004799842834473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,32,power_law_1.01,0.4074431896209717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,32,power_law_1.2,0.4131648063659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,32,power_law_1.2,0.4273856163024902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,4,balanced,0.5838079849878947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,4,balanced,0.5841279824574789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,4,power_law_1.01,0.7371071815490723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,4,power_law_1.01,0.7565951824188233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,4,power_law_1.2,0.7493951797485352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,4,power_law_1.2,0.7604032039642334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,64,balanced,0.33483731746673584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,64,balanced,0.3359520037968953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,64,power_law_1.01,0.37635838985443115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,64,power_law_1.01,0.38027520179748536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,64,power_law_1.2,0.3927488088607788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,64,power_law_1.2,0.399833607673645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,8,balanced,0.4515146811803182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,8,balanced,0.45213866233825684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,8,power_law_1.01,0.551526403427124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,8,power_law_1.01,0.5571839809417725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,8,power_law_1.2,0.5744895935058594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,1,8,power_law_1.2,0.585913610458374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,2,1,balanced,0.7469120025634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,2,1,balanced,0.7485067049662272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,2,1,power_law_1.01,0.9903936386108398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,2,1,power_law_1.01,1.0006912231445313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,2,1,power_law_1.2,1.0372096061706544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,2,1,power_law_1.2,1.0378496170043945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,4,1,balanced,0.47572799523671466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,4,1,balanced,0.4757653474807739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,4,1,power_law_1.01,0.6008063793182373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,4,1,power_law_1.01,0.6048192024230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,4,1,power_law_1.2,0.6243904113769532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,3072,1536,8,256,4,1,power_law_1.2,0.6335616111755371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,1,balanced,2.8640054066975913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,1,balanced,2.8837385177612305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,1,power_law_1.01,3.035878372192383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,1,power_law_1.01,3.0518720626831053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,1,power_law_1.2,3.0253503799438475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,1,power_law_1.2,3.044595146179199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,2,balanced,1.7008213996887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,2,balanced,1.702778657277425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,2,power_law_1.01,2.0347455978393554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,2,power_law_1.01,2.260870361328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,2,power_law_1.2,2.1901248931884765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,2,power_law_1.2,2.3956159591674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,4,balanced,1.0666293303171794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,4,balanced,1.0702933470408122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,4,power_law_1.01,1.6767232894897461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,4,power_law_1.01,1.8331968307495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,4,power_law_1.2,1.8866304397583007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,4,power_law_1.2,1.9049152374267577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,8,balanced,0.7515040238698324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,8,balanced,0.7517600059509277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,8,power_law_1.01,1.5347135543823243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,8,power_law_1.01,1.5860735893249511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,8,power_law_1.2,1.5097151756286622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,1,8,power_law_1.2,1.6296960830688476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,16,1,balanced,0.278714656829834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,16,1,balanced,0.2810453375180562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,16,1,power_law_1.01,0.2825536012649536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,16,1,power_law_1.01,0.2836416006088257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,16,1,power_law_1.2,0.28178560733795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,16,1,power_law_1.2,0.28296959400177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,2,1,balanced,1.4636640548706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,2,1,balanced,1.4657227198282878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,2,1,power_law_1.01,1.5384575843811035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,2,1,power_law_1.01,1.5419327735900878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,2,1,power_law_1.2,1.5388735771179198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,2,1,power_law_1.2,1.5437439918518066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,4,1,balanced,0.7863626480102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,4,1,balanced,0.7907466888427734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,4,1,power_law_1.01,0.8128191947937011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,4,1,power_law_1.01,0.8180543899536132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,4,1,power_law_1.2,0.8158528327941894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,4,1,power_law_1.2,0.822815990447998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,8,1,balanced,0.44844265778859455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,8,1,balanced,0.4484853347142537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,8,1,power_law_1.01,0.4606783866882324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,8,1,power_law_1.01,0.46648321151733396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,8,1,power_law_1.2,0.4585792064666748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,14336,2,8,8,1,power_law_1.2,0.46679039001464845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,1,balanced,1.455850601196289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,1,balanced,1.457797368367513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,1,power_law_1.01,1.8012544631958007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,1,power_law_1.01,1.802297592163086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,1,power_law_1.2,1.8250303268432617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,1,power_law_1.2,1.8364479064941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,128,balanced,0.3370720148086548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,128,balanced,0.33879999319712323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,128,power_law_1.01,0.3896768093109131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,128,power_law_1.01,0.3937279939651489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,128,power_law_1.2,0.43036160469055174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,128,power_law_1.2,0.4378176212310791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,16,balanced,0.3999520142873128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,16,balanced,0.4006346861521403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,16,power_law_1.01,0.49361281394958495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,16,power_law_1.01,0.49957761764526365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,16,power_law_1.2,0.5232319831848145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,16,power_law_1.2,0.576857614517212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,2,balanced,0.9177119731903076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,2,balanced,0.9184799989064535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,2,power_law_1.01,1.1427200317382813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,2,power_law_1.01,1.152729606628418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,2,power_law_1.2,1.1703424453735352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,2,power_law_1.2,1.1768192291259765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,32,balanced,0.36372268199920654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,32,balanced,0.3643146753311157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,32,power_law_1.01,0.43584637641906737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,32,power_law_1.01,0.45450878143310547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,32,power_law_1.2,0.4669248104095459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,32,power_law_1.2,0.4886591911315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,4,balanced,0.6263466676076254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,4,balanced,0.6298133134841919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,4,power_law_1.01,0.7728000164031983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,4,power_law_1.01,0.782751989364624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,4,power_law_1.2,0.8178112030029296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,4,power_law_1.2,0.8179903984069824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,64,balanced,0.3457760016123454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,64,balanced,0.34652801354726154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,64,power_law_1.01,0.41864957809448244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,64,power_law_1.01,0.4218560218811035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,64,power_law_1.2,0.45136637687683107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,64,power_law_1.2,0.4564032077789307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,8,balanced,0.47677334149678546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,8,balanced,0.47783998648325604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,8,power_law_1.01,0.621395206451416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,8,power_law_1.01,0.6457151889801025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,8,power_law_1.2,0.6159808158874511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,1,8,power_law_1.2,0.6891903877258301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,2,1,balanced,0.8476479848225912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,2,1,balanced,0.8492213090260824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,2,1,power_law_1.01,0.9942912101745606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,2,1,power_law_1.01,0.9944128036499024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,2,1,power_law_1.2,0.9926400184631348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,2,1,power_law_1.2,1.0012415885925292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,4,1,balanced,0.5386399825414022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,4,1,balanced,0.5400426785151163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,4,1,power_law_1.01,0.6104832172393799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,4,1,power_law_1.01,0.6141695976257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,4,1,power_law_1.2,0.6154431819915771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,1536,8,128,4,1,power_law_1.2,0.6229568004608155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,1,balanced,8.976890563964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,1,balanced,8.978458404541016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,1,power_law_1.01,9.145203399658204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,1,power_law_1.01,9.16126708984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,1,power_law_1.2,9.296166229248048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,1,power_law_1.2,9.348121643066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,128,balanced,1.2606453100840251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,128,balanced,1.2635253270467122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,128,power_law_1.01,1.3619711875915528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,128,power_law_1.01,1.365824031829834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,128,power_law_1.2,1.4116224288940429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,128,power_law_1.2,1.4201472282409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,16,balanced,1.701866626739502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,16,balanced,1.7038826942443848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,16,power_law_1.01,1.838265609741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,16,power_law_1.01,1.853580856323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,16,power_law_1.2,1.9493951797485352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,16,power_law_1.2,2.0019392013549804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,2,balanced,5.1475785573323565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,2,balanced,5.149013201395671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,2,power_law_1.01,5.322553634643555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,2,power_law_1.01,5.378924942016601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,2,power_law_1.2,5.449407958984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,2,power_law_1.2,5.61262092590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,256,balanced,1.2287840048472087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,256,balanced,1.2323626677195232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,256,power_law_1.01,1.3157055854797364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,256,power_law_1.01,1.3161727905273437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,256,power_law_1.2,1.3615103721618653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,256,power_law_1.2,1.3745023727416992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,32,balanced,1.4489067395528157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,32,balanced,1.4489226341247559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,32,power_law_1.01,1.5902720451354981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,32,power_law_1.01,1.6150720596313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,32,power_law_1.2,1.6297536849975587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,32,power_law_1.2,1.657209587097168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,4,balanced,3.182501475016276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,4,balanced,3.184213320414225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,4,power_law_1.01,3.3767040252685545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,4,power_law_1.01,3.382329559326172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,4,power_law_1.2,3.481523132324219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,4,power_law_1.2,3.56927375793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,64,balanced,1.3214826583862305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,64,balanced,1.3257546424865723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,64,power_law_1.01,1.4420736312866211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,64,power_law_1.01,1.4537983894348145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,64,power_law_1.2,1.4800383567810058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,64,power_law_1.2,1.5059904098510741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,8,balanced,2.197312037150065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,8,balanced,2.2013227144877114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,8,power_law_1.01,2.373094367980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,8,power_law_1.01,2.397126388549805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,8,power_law_1.2,2.511078453063965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,4096,2688,22,512,1,8,power_law_1.2,2.5243520736694336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,1,balanced,4.659839948018392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,1,balanced,4.661770820617676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,1,power_law_1.01,4.849068832397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,1,power_law_1.01,4.919910430908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,1,power_law_1.2,4.846316909790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,1,power_law_1.2,4.8830078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,2,balanced,2.6496960322062173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,2,balanced,2.650309403737386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,2,power_law_1.01,3.659648132324219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,2,power_law_1.01,3.6696193695068358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,2,power_law_1.2,3.0785343170166017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,2,power_law_1.2,3.4206783294677736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,4,balanced,1.5708799362182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,4,balanced,1.57097593943278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,4,power_law_1.01,2.5302656173706053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,4,power_law_1.01,2.9776256561279295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,4,power_law_1.2,2.591744041442871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,4,power_law_1.2,3.0703039169311523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,8,balanced,1.0927146275838215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,8,balanced,1.0967786312103271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,8,power_law_1.01,2.1715072631835937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,8,power_law_1.01,2.316780853271484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,8,power_law_1.2,2.4267711639404297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,1,8,power_law_1.2,2.4419904708862306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,16,1,balanced,0.41703999042510986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,16,1,balanced,0.4184533357620239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,16,1,power_law_1.01,0.41925759315490724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,16,1,power_law_1.01,0.4249407768249512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,16,1,power_law_1.2,0.42062082290649416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,16,1,power_law_1.2,0.42197117805480955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,2,1,balanced,2.3671199480692544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,2,1,balanced,2.3689014116923013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,2,1,power_law_1.01,2.4635904312133787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,2,1,power_law_1.01,2.4728960037231444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,2,1,power_law_1.2,2.4410560607910154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,2,1,power_law_1.2,2.443654441833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,32,1,balanced,0.26492265860239667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,32,1,balanced,0.2653546730677287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,32,1,power_law_1.01,0.268556809425354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,32,1,power_law_1.01,0.26874239444732667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,32,1,power_law_1.2,0.26803200244903563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,32,1,power_law_1.2,0.26832640171051025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,4,1,balanced,1.2394239902496338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,4,1,balanced,1.2395093441009521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,4,1,power_law_1.01,1.3047679901123046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,4,1,power_law_1.01,1.3057279586791992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,4,1,power_law_1.2,1.2825407981872559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,4,1,power_law_1.2,1.3010496139526366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,8,1,balanced,0.6767786343892416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,8,1,balanced,0.6777013142903646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,8,1,power_law_1.01,0.7245759963989258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,8,1,power_law_1.01,0.7285888195037842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,8,1,power_law_1.2,0.7192255973815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,16384,2,8,8,1,power_law_1.2,0.720908784866333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,1,balanced,2.9934186935424805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,1,balanced,2.996218681335449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,1,power_law_1.01,4.245868682861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,1,power_law_1.01,4.248608016967774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,1,power_law_1.2,4.4176383972167965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,1,power_law_1.2,4.443807983398438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,128,balanced,0.515008012453715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,128,balanced,0.5164426565170288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,128,power_law_1.01,0.5949376106262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,128,power_law_1.01,0.6036928176879883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,128,power_law_1.2,0.628768014907837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,128,power_law_1.2,0.6302720069885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,16,balanced,0.6573866605758667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,16,balanced,0.6593919992446899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,16,power_law_1.01,0.81277437210083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,16,power_law_1.01,0.825715160369873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,16,power_law_1.2,0.8557632446289063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,16,power_law_1.2,0.8880640029907226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,2,balanced,1.7838080724080403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,2,balanced,1.785871982574463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,2,power_law_1.01,2.483244705200195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,2,power_law_1.01,2.5239744186401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,2,power_law_1.2,2.5380287170410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,2,power_law_1.2,2.5601408004760744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,256,balanced,0.5081439812978109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,256,balanced,0.5095146497090658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,256,power_law_1.01,0.5565120220184326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,256,power_law_1.01,0.5695551872253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,256,power_law_1.2,0.5963520050048828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,256,power_law_1.2,0.6091135978698731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,32,balanced,0.5758399963378906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,32,balanced,0.5762826601664225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,32,power_law_1.01,0.7074048042297363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,32,power_law_1.01,0.710316801071167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,32,power_law_1.2,0.7535999774932861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,32,power_law_1.2,0.7753087997436523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,4,balanced,1.1498239835103352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,4,balanced,1.152026653289795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,4,power_law_1.01,1.5296192169189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,4,power_law_1.01,1.5571583747863769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,4,power_law_1.2,1.6435583114624024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,4,power_law_1.2,1.6462015151977538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,64,balanced,0.5315146843592325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,64,balanced,0.5334719816843668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,64,power_law_1.01,0.62773118019104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,64,power_law_1.01,0.6311168193817138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,64,power_law_1.2,0.6649024009704589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,64,power_law_1.2,0.67324800491333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,8,balanced,0.8006772994995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,8,balanced,0.8024373054504395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,8,power_law_1.01,1.0926527976989746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,8,power_law_1.01,1.1054271697998046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,8,power_law_1.2,1.1827839851379394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,1,8,power_law_1.2,1.2261952400207519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,16,1,balanced,0.5224106709162394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,16,1,balanced,0.5227786699930826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,16,1,power_law_1.01,0.6480832099914551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,16,1,power_law_1.01,0.6481599807739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,16,1,power_law_1.2,0.6933440208435059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,16,1,power_law_1.2,0.6944640159606934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,2,1,balanced,1.6494560241699219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,2,1,balanced,1.6502399444580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,2,1,power_law_1.01,2.312019157409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,2,1,power_law_1.01,2.323801612854004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,2,1,power_law_1.2,2.3908159255981447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,2,1,power_law_1.2,2.399955177307129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,4,1,balanced,0.9655146598815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,4,1,balanced,0.9668746789296468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,4,1,power_law_1.01,1.3172800064086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,4,1,power_law_1.01,1.3296128273010255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,4,1,power_law_1.2,1.361945629119873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,4,1,power_law_1.2,1.3663104057312012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,8,1,balanced,0.8485066890716553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,8,1,balanced,0.8505173524220785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,8,1,power_law_1.01,0.9418432235717773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,8,1,power_law_1.01,0.9446911811828613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,8,1,power_law_1.2,0.9568384170532227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2048,8,256,8,1,power_law_1.2,0.9651391983032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,1,balanced,3.9911680221557617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,1,balanced,3.9912853240966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,1,power_law_1.01,4.385299301147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,1,power_law_1.01,4.403340911865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,1,power_law_1.2,4.464627075195312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,1,power_law_1.2,4.482912063598633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,16,balanced,0.7364426453908285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,16,balanced,0.7373759746551514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,16,power_law_1.01,0.8888128280639649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,16,power_law_1.01,0.9225279808044433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,16,power_law_1.2,0.9611583709716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,16,power_law_1.2,1.0245759963989258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,2,balanced,2.2786666552225747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,2,balanced,2.27893336613973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,2,power_law_1.01,2.543737602233887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,2,power_law_1.01,2.7379392623901366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,2,power_law_1.2,2.591212844848633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,2,power_law_1.2,2.653139114379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,32,balanced,0.61844801902771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,32,balanced,0.6191946665445963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,32,power_law_1.01,0.7898111820220948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,32,power_law_1.01,0.8031999588012695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,32,power_law_1.2,0.8445311546325683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,32,power_law_1.2,0.858886432647705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,4,balanced,1.3809547424316406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,4,balanced,1.3822612762451172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,4,power_law_1.01,1.5924287796020509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,4,power_law_1.01,1.6280895233154298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,4,power_law_1.2,1.7082176208496094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,4,power_law_1.2,1.7311935424804688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,8,balanced,0.9512693087259928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,8,balanced,0.9518773555755615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,8,power_law_1.01,1.1254079818725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,8,power_law_1.01,1.1494208335876466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,8,power_law_1.2,1.2362367630004882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,1,8,power_law_1.2,1.2995136260986329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,2,1,balanced,2.160325368245443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,2,1,balanced,2.1613547007242837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,2,1,power_law_1.01,2.369811248779297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,2,1,power_law_1.01,2.3886783599853514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,2,1,power_law_1.2,2.41976318359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,2,1,power_law_1.2,2.424787139892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,4,1,balanced,1.224128007888794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,4,1,balanced,1.2259039878845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,4,1,power_law_1.01,1.3467391967773437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,4,1,power_law_1.01,1.3536064147949218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,4,1,power_law_1.2,1.3586112022399903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,6144,2560,8,160,4,1,power_law_1.2,1.3626367568969726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,1,balanced,3.449274698893229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,1,balanced,3.4515679677327475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,1,power_law_1.01,4.906502532958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,1,power_law_1.01,4.942067337036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,1,power_law_1.2,5.0696769714355465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,1,power_law_1.2,5.104787063598633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,128,balanced,0.5567306677500407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,128,balanced,0.5587360064188639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,128,power_law_1.01,0.6538943767547607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,128,power_law_1.01,0.6633088111877441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,128,power_law_1.2,0.6805888175964355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,128,power_law_1.2,0.6903808116912842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,16,balanced,0.7258133093516032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,16,balanced,0.7267466386159261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,16,power_law_1.01,0.9310527801513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,16,power_law_1.01,0.9357695579528809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,16,power_law_1.2,0.9711296081542968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,16,power_law_1.2,1.0308799743652344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,2,balanced,2.0399413108825684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,2,balanced,2.040485382080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,2,power_law_1.01,2.839743995666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,2,power_law_1.01,2.8410688400268556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,2,power_law_1.2,2.8717056274414063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,2,power_law_1.2,2.9322368621826174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,256,balanced,0.547754685084025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,256,balanced,0.5504639943440756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,256,power_law_1.01,0.6104320049285888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,256,power_law_1.01,0.6111936092376709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,256,power_law_1.2,0.6612927913665771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,256,power_law_1.2,0.6640511989593506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,32,balanced,0.6301653385162354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,32,balanced,0.6302560170491537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,32,power_law_1.01,0.7782527923583984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,32,power_law_1.01,0.7951488018035888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,32,power_law_1.2,0.8036671638488769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,32,power_law_1.2,0.8574015617370605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,4,balanced,1.296837329864502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,4,balanced,1.2981706460316975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,4,power_law_1.01,1.7358720779418946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,4,power_law_1.01,1.7776063919067382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,4,power_law_1.2,1.8876352310180664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,4,power_law_1.2,1.9071231842041017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,64,balanced,0.5790293216705322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,64,balanced,0.5799093246459961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,64,power_law_1.01,0.6806272029876709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,64,power_law_1.01,0.6952832221984864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,64,power_law_1.2,0.7604735851287842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,64,power_law_1.2,0.7775872230529786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,8,balanced,0.8947733243306478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,8,balanced,0.8953493436177572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,8,power_law_1.01,1.2373056411743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,8,power_law_1.01,1.2743103981018067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,8,power_law_1.2,1.2836095809936523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,1,8,power_law_1.2,1.2955455780029297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,16,1,balanced,0.6007359822591146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,16,1,balanced,0.6010133425394694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,16,1,power_law_1.01,0.746457576751709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,16,1,power_law_1.01,0.7494016170501709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,16,1,power_law_1.2,0.8042943954467774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,16,1,power_law_1.2,0.8075008392333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,2,1,balanced,1.9047253926595051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,2,1,balanced,1.9051574071248372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,2,1,power_law_1.01,2.6655359268188477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,2,1,power_law_1.01,2.681260871887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,2,1,power_law_1.2,2.779648017883301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,2,1,power_law_1.2,2.7903871536254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,4,1,balanced,1.1113226413726807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,4,1,balanced,1.11190398534139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,4,1,power_law_1.01,1.5219776153564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,4,1,power_law_1.01,1.5236800193786622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,4,1,power_law_1.2,1.5613311767578124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,4,1,power_law_1.2,1.5820672035217285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,8,1,balanced,0.9976533253987631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,8,1,balanced,1.0019893646240234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,8,1,power_law_1.01,1.0888319969177247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,8,1,power_law_1.01,1.0894528388977052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,8,1,power_law_1.2,1.110585594177246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,256,8,1,power_law_1.2,1.1140416145324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,1,balanced,4.918944040934245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,1,balanced,4.921632130940755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,1,power_law_1.01,5.833164978027344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,1,power_law_1.01,5.849689483642578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,1,power_law_1.2,6.123360061645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,1,power_law_1.2,6.124236679077148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,128,balanced,0.6222399870554606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,128,balanced,0.6236533323923746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,128,power_law_1.01,0.6943999767303467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,128,power_law_1.01,0.6961023807525635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,128,power_law_1.2,0.7353024005889892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,128,power_law_1.2,0.7383872032165527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,16,balanced,0.8678507010142008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,16,balanced,0.8703359762827555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,16,power_law_1.01,1.0046079635620118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,16,power_law_1.01,1.0668736457824708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,16,power_law_1.2,1.0721983909606934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,16,power_law_1.2,1.086143970489502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,2,balanced,2.799706776936849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,2,balanced,2.799861272176107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,2,power_law_1.01,3.239744186401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,2,power_law_1.01,3.4248126983642577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,2,power_law_1.2,3.4725566864013673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,2,power_law_1.2,3.476838302612305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,32,balanced,0.7316906452178955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,32,balanced,0.7317226727803549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,32,power_law_1.01,0.8368063926696777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,32,power_law_1.01,0.8491647720336915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,32,power_law_1.2,0.8864383697509766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,32,power_law_1.2,0.8941503524780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,4,balanced,1.7023413976033528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,4,balanced,1.7060693105061848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,4,power_law_1.01,2.0285951614379885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,4,power_law_1.01,2.0745471954345702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,4,power_law_1.2,2.0993152618408204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,4,power_law_1.2,2.196544075012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,64,balanced,0.6560426553090414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,64,balanced,0.656607985496521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,64,power_law_1.01,0.7372799873352051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,64,power_law_1.01,0.7513408184051513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,64,power_law_1.2,0.7938240051269532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,64,power_law_1.2,0.8034751892089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,8,balanced,1.1516319910685222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,8,balanced,1.1517493724822998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,8,power_law_1.01,1.3750080108642577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,8,power_law_1.01,1.3759743690490722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,8,power_law_1.2,1.396992015838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,1,8,power_law_1.2,1.4538047790527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,16,1,balanced,0.7808000246683756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,16,1,balanced,0.7838719685872396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,16,1,power_law_1.01,0.8951423645019532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,16,1,power_law_1.01,0.9046655654907226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,16,1,power_law_1.2,0.9090047836303711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,16,1,power_law_1.2,0.9183615684509278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,2,1,balanced,2.6674187978108725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,2,1,balanced,2.6695146560668945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,2,1,power_law_1.01,3.161292839050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,2,1,power_law_1.01,3.1989696502685545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,2,1,power_law_1.2,3.3090625762939454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,2,1,power_law_1.2,3.3559295654296877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,4,1,balanced,1.5869706471761067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,4,1,balanced,1.5887999534606934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,4,1,power_law_1.01,1.853068733215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,4,1,power_law_1.01,1.8598079681396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,4,1,power_law_1.2,1.9231487274169923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,4,1,power_law_1.2,1.94006404876709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,8,1,balanced,1.045973300933838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,8,1,balanced,1.0466346740722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,8,1,power_law_1.01,1.190553569793701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,8,1,power_law_1.01,1.2040960311889648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,8,1,power_law_1.2,1.2510592460632324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,2048,7168,2048,8,384,8,1,power_law_1.2,1.2537407875061035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,1,balanced,0.1520853340625763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,1,balanced,0.1525813341140747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,1,power_law_1.01,0.1753216028213501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,1,power_law_1.01,0.1756160020828247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,1,power_law_1.2,0.17786240577697754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,1,power_law_1.2,0.17971199750900269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,128,balanced,0.059232001503308616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,128,balanced,0.060405333836873375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,128,power_law_1.01,0.058208000659942624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,128,power_law_1.01,0.058950400352478026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,128,power_law_1.2,0.06032000184059143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,128,power_law_1.2,0.06072319746017456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,16,balanced,0.06635199983914693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,16,balanced,0.06651733318964641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,16,power_law_1.01,0.06660479903221131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,16,power_law_1.01,0.06875519752502442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,16,power_law_1.2,0.06683520078659058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,16,power_law_1.2,0.06895999908447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,2,balanced,0.1483733355998993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,2,balanced,0.14983999729156494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,2,power_law_1.01,0.14885760545730592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,2,power_law_1.01,0.14998400211334229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,2,power_law_1.2,0.15180799961090088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,2,power_law_1.2,0.15323519706726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,32,balanced,0.06216000020503998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,32,balanced,0.06282133360703786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,32,power_law_1.01,0.06242560148239136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,32,power_law_1.01,0.06264320015907288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,32,power_law_1.2,0.0625216007232666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,32,power_law_1.2,0.06295040249824524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,4,balanced,0.10916266838709514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,4,balanced,0.11027733484903972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,4,power_law_1.01,0.10795520544052124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,4,power_law_1.01,0.11047040224075318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,4,power_law_1.2,0.10871039628982544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,4,power_law_1.2,0.11065599918365479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,64,balanced,0.05938666562239329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,64,balanced,0.06126933296521505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,64,power_law_1.01,0.060185599327087405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,64,power_law_1.01,0.06113280057907104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,64,power_law_1.2,0.06069759726524353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,64,power_law_1.2,0.061382400989532473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,8,balanced,0.07423999905586243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,8,balanced,0.0766186664501826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,8,power_law_1.01,0.07704960107803345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,8,power_law_1.2,0.07672960162162781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,1,8,power_law_1.2,0.07752320170402527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,2,1,balanced,0.10982933640480042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,2,1,balanced,0.11137066284815471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,2,1,power_law_1.01,0.11570559740066529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,2,1,power_law_1.01,0.11585919857025147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,2,1,power_law_1.2,0.11669119596481323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,2048,768,8,128,2,1,power_law_1.2,0.11706880331039429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,1,balanced,1.0561599731445312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,1,balanced,1.0564853350321453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,1,power_law_1.01,0.9172672271728516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,1,power_law_1.01,0.922976016998291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,1,power_law_1.2,0.9147711753845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,1,power_law_1.2,0.9385984420776368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,128,balanced,0.11331199606259663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,128,balanced,0.11539199948310852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,128,power_law_1.01,0.11384320259094238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,128,power_law_1.01,0.11454720497131347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,128,power_law_1.2,0.1148800015449524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,128,power_law_1.2,0.11493120193481446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,16,balanced,0.17324799299240112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,16,balanced,0.1747786601384481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,16,power_law_1.01,0.1646463990211487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,16,power_law_1.01,0.16833920478820802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,16,power_law_1.2,0.1646656036376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,16,power_law_1.2,0.16677119731903076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,2,balanced,0.5883520046869913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,2,balanced,0.5884426832199097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,2,power_law_1.01,0.5350719928741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,2,power_law_1.01,0.5378111839294434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,2,power_law_1.2,0.521888017654419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,2,power_law_1.2,0.5346240043640137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,256,balanced,0.11146666606267293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,256,balanced,0.11242666840553284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,256,power_law_1.01,0.11100800037384033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,256,power_law_1.01,0.1112064003944397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,256,power_law_1.2,0.11208959817886352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,256,power_law_1.2,0.1122431993484497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,32,balanced,0.14010666807492575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,32,balanced,0.1421173314253489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,32,power_law_1.01,0.13687039613723756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,32,power_law_1.01,0.13756799697875977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,32,power_law_1.2,0.13432320356369018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,32,power_law_1.2,0.13918720483779906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,4,balanced,0.3567039966583252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,4,balanced,0.3569600184758504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,4,power_law_1.01,0.32077438831329347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,4,power_law_1.01,0.325548791885376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,4,power_law_1.2,0.31816959381103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,4,power_law_1.2,0.3263040065765381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,64,balanced,0.12396799524625142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,64,balanced,0.12572800119717917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,64,power_law_1.01,0.1214784026145935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,64,power_law_1.01,0.12323199510574341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,64,power_law_1.2,0.12208000421524048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,64,power_law_1.2,0.1225600004196167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,8,balanced,0.23538132508595785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,8,balanced,0.2362933357556661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,8,power_law_1.01,0.22196478843688966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,8,power_law_1.01,0.22410879135131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,8,power_law_1.2,0.21929600238800048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,1,8,power_law_1.2,0.22001280784606933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,2,1,balanced,0.5892693201700846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,2,1,balanced,0.5910933415095011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,2,1,power_law_1.01,0.5134272098541259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,2,1,power_law_1.01,0.516435194015503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,2,1,power_law_1.2,0.5275263786315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,2,1,power_law_1.2,0.5394495964050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,4,1,balanced,0.35625600814819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,4,1,balanced,0.3569120168685913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,4,1,power_law_1.01,0.3124864101409912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,4,1,power_law_1.01,0.3133568048477173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,4,1,power_law_1.2,0.31468160152435304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,3072,1536,8,256,4,1,power_law_1.2,0.3157504081726074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,1,balanced,0.4925706783930461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,1,balanced,0.49426666895548504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,1,power_law_1.01,0.7001984119415283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,1,power_law_1.01,0.709164810180664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,1,power_law_1.2,0.7045375823974609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,1,power_law_1.2,0.7128448009490966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,2,balanced,0.36184000968933105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,2,balanced,0.3657333453496297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,2,power_law_1.01,0.4411007881164551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,2,power_law_1.01,0.4593984127044678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,2,power_law_1.2,0.4403711795806885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,2,power_law_1.2,0.4475264072418213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,4,balanced,0.29077865680058795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,4,balanced,0.2924000024795532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,4,power_law_1.01,0.3663552045822144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,4,power_law_1.01,0.3755903959274292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,4,power_law_1.2,0.3583103895187378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,4,power_law_1.2,0.36506879329681396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,8,balanced,0.25979199012120563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,8,balanced,0.26078933477401733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,8,power_law_1.01,0.3304383993148804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,8,power_law_1.01,0.33215999603271484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,8,power_law_1.2,0.3264960050582886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,1,8,power_law_1.2,0.33208959102630614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,16,1,balanced,0.08587200442949931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,16,1,balanced,0.08619733651479085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,16,1,power_law_1.01,0.08822399973869324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,16,1,power_law_1.01,0.08889600038528442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,16,1,power_law_1.2,0.09194239974021912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,16,1,power_law_1.2,0.09228159785270691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,2,1,balanced,0.28151466449101764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,2,1,balanced,0.28220266103744507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,2,1,power_law_1.01,0.3742847919464111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,2,1,power_law_1.01,0.37909119129180907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,2,1,power_law_1.2,0.3681855916976929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,2,1,power_law_1.2,0.3794048070907593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,4,1,balanced,0.1632480025291443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,4,1,balanced,0.16726932922999063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,4,1,power_law_1.01,0.21865599155426024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,4,1,power_law_1.01,0.21943039894104005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,4,1,power_law_1.2,0.2185920000076294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,4,1,power_law_1.2,0.21877760887145997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,8,1,balanced,0.10110400120417277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,8,1,balanced,0.10212799906730652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,8,1,power_law_1.01,0.1457856059074402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,8,1,power_law_1.01,0.14592000246047973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,8,1,power_law_1.2,0.14507520198822021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,14336,2,8,8,1,power_law_1.2,0.1454208016395569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,1,balanced,0.7272853056589762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,1,balanced,0.7290346622467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,1,power_law_1.01,0.7391039848327636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,1,power_law_1.01,0.7422719955444336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,1,power_law_1.2,0.751091194152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,1,power_law_1.2,0.7638783931732178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,128,balanced,0.10043199857076009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,128,balanced,0.10168533523877461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,128,power_law_1.01,0.10277119874954224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,128,power_law_1.01,0.10484479665756226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,128,power_law_1.2,0.10276479721069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,128,power_law_1.2,0.10793600082397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,16,balanced,0.1325493355592092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,16,balanced,0.13320533434549967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,16,power_law_1.01,0.132697594165802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,16,power_law_1.01,0.13715200424194335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,16,power_law_1.2,0.13831679821014403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,16,power_law_1.2,0.13868160247802735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,2,balanced,0.42661865552266437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,2,balanced,0.4270346562067668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,2,power_law_1.01,0.4270656108856201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,2,power_law_1.01,0.43300480842590333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,2,power_law_1.2,0.4302656173706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,2,power_law_1.2,0.43452157974243166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,32,balanced,0.12141333023707072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,32,balanced,0.12191466490427653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,32,power_law_1.01,0.11962239742279053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,32,power_law_1.01,0.12058240175247192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,32,power_law_1.2,0.12101119756698608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,32,power_law_1.2,0.12244479656219483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,4,balanced,0.2544586658477783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,4,balanced,0.25517867008845013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,4,power_law_1.01,0.26326398849487304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,4,power_law_1.01,0.2671744108200073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,4,power_law_1.2,0.26752638816833496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,4,power_law_1.2,0.27041919231414796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,64,balanced,0.11401066184043884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,64,balanced,0.11402133107185364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,64,power_law_1.01,0.11335680484771729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,64,power_law_1.01,0.11600639820098876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,64,power_law_1.2,0.11438080072402954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,64,power_law_1.2,0.11463680267333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,8,balanced,0.1818079948425293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,8,balanced,0.18347734212875366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,8,power_law_1.01,0.18184959888458252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,8,power_law_1.01,0.1824447989463806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,8,power_law_1.2,0.18408960103988647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,1,8,power_law_1.2,0.18757760524749756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,2,1,balanced,0.25546665986378986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,2,1,balanced,0.2563520073890686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,2,1,power_law_1.01,0.30782079696655273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,2,1,power_law_1.01,0.3083584070205688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,2,1,power_law_1.2,0.3108992099761963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,2,1,power_law_1.2,0.3129856109619141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,4,1,balanced,0.17691200971603394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,4,1,balanced,0.1772586703300476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,4,1,power_law_1.01,0.19333120584487914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,4,1,power_law_1.01,0.19474560022354126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,4,1,power_law_1.2,0.19630719423294068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,1536,8,128,4,1,power_law_1.2,0.19657599925994873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,1,balanced,4.562965393066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,1,balanced,4.566522598266602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,1,power_law_1.01,4.17283821105957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,1,power_law_1.01,4.231679916381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,1,power_law_1.2,4.4281982421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,1,power_law_1.2,4.440256118774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,128,balanced,0.3625653187433879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,128,balanced,0.36325867970784503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,128,power_law_1.01,0.35939199924468995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,128,power_law_1.01,0.3602816104888916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,128,power_law_1.2,0.36459519863128664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,128,power_law_1.2,0.3724544048309326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,16,balanced,0.6088320016860962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,16,balanced,0.6120906670888265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,16,power_law_1.01,0.594214391708374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,16,power_law_1.01,0.6020736217498779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,16,power_law_1.2,0.6224639892578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,16,power_law_1.2,0.623583984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,2,balanced,2.4711786905924478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,2,balanced,2.472047964731852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,2,power_law_1.01,2.3040128707885743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,2,power_law_1.01,2.306713676452637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,2,power_law_1.2,2.3785600662231445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,2,power_law_1.2,2.4093759536743162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,256,balanced,0.3442666530609131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,256,balanced,0.3455093304316203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,256,power_law_1.01,0.3435328006744385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,256,power_law_1.01,0.343884801864624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,256,power_law_1.2,0.3536704063415527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,256,power_law_1.2,0.35459198951721194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,32,balanced,0.47375468413035077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,32,balanced,0.474021315574646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,32,power_law_1.01,0.46225919723510744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,32,power_law_1.01,0.47097601890563967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,32,power_law_1.2,0.473689603805542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,32,power_law_1.2,0.47954559326171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,4,balanced,1.4110506375630696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,4,balanced,1.4143733978271484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,4,power_law_1.01,1.313708782196045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,4,power_law_1.01,1.3142399787902832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,4,power_law_1.2,1.377894401550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,4,power_law_1.2,1.4027135848999024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,64,balanced,0.40622933705647785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,64,balanced,0.4065653483072917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,64,power_law_1.01,0.4012671947479248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,64,power_law_1.01,0.40375680923461915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,64,power_law_1.2,0.414412784576416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,64,power_law_1.2,0.41536641120910645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,8,balanced,0.8820746739705404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,8,balanced,0.8844426472981771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,8,power_law_1.01,0.8253567695617676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,8,power_law_1.01,0.8347071647644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,8,power_law_1.2,0.8703424453735351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,4096,2688,22,512,1,8,power_law_1.2,0.8760191917419433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,1,balanced,0.816800038019816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,1,balanced,0.8175466855367025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,1,power_law_1.01,1.094099235534668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,1,power_law_1.01,1.1361663818359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,1,power_law_1.2,1.084665584564209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,1,power_law_1.2,1.128121566772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,2,balanced,0.48659733931223553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,2,balanced,0.48770666122436523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,2,power_law_1.01,0.7627456188201904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,2,power_law_1.01,0.7874048233032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,2,power_law_1.2,0.7737343788146973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,2,power_law_1.2,0.7741248130798339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,4,balanced,0.36511464913686115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,4,balanced,0.3673280080159505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,4,power_law_1.01,0.48665599822998046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,4,power_law_1.01,0.51560959815979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,4,power_law_1.2,0.4864192008972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,4,power_law_1.2,0.5046720027923584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,8,balanced,0.31860800584157306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,8,balanced,0.318725327650706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,8,power_law_1.01,0.41454081535339354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,8,power_law_1.01,0.44325761795043944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,8,power_law_1.2,0.42378878593444824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,1,8,power_law_1.2,0.4328127861022949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,16,1,balanced,0.11845333377520244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,16,1,balanced,0.12334932883580525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,16,1,power_law_1.01,0.12463359832763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,16,1,power_law_1.01,0.125600004196167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,16,1,power_law_1.2,0.12257920503616333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,16,1,power_law_1.2,0.12302080392837525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,2,1,balanced,0.45181866486867267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,2,1,balanced,0.45211732387542725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,2,1,power_law_1.01,0.5354879856109619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,2,1,power_law_1.01,0.5856192111968994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,2,1,power_law_1.2,0.6045055866241456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,2,1,power_law_1.2,0.6065343856811524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,32,1,balanced,0.09842133522033691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,32,1,balanced,0.10512533783912659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,32,1,power_law_1.01,0.10288000106811523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,32,1,power_law_1.01,0.10473599433898925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,32,1,power_law_1.2,0.1044927954673767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,32,1,power_law_1.2,0.10496000051498414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,4,1,balanced,0.2485599915186564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,4,1,balanced,0.2490346630414327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,4,1,power_law_1.01,0.312064003944397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,4,1,power_law_1.01,0.3395391941070557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,4,1,power_law_1.2,0.32480640411376954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,4,1,power_law_1.2,0.3322943925857544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,8,1,balanced,0.1444906691710154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,8,1,balanced,0.1453333298365275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,8,1,power_law_1.01,0.20135679244995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,8,1,power_law_1.01,0.2075455904006958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,8,1,power_law_1.2,0.20135679244995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,16384,2,8,8,1,power_law_1.2,0.20682239532470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,1,balanced,2.5920586585998535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,1,balanced,2.592319965362549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,1,power_law_1.01,2.2641408920288084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,1,power_law_1.01,2.2907007217407225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,1,power_law_1.2,2.299488067626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,1,power_law_1.2,2.317100715637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,128,balanced,0.18789867560068765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,128,balanced,0.19249600172042847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,128,power_law_1.01,0.18837120532989501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,128,power_law_1.01,0.18878079652786256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,128,power_law_1.2,0.18817280530929564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,128,power_law_1.2,0.18972159624099733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,16,balanced,0.32411734263102215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,16,balanced,0.32573866844177246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,16,power_law_1.01,0.30487039089202883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,16,power_law_1.01,0.3056191921234131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,16,power_law_1.2,0.3130176067352295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,16,power_law_1.2,0.3151999950408936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,2,balanced,1.3820959726969402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,2,balanced,1.3835733731587727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,2,power_law_1.01,1.1981632232666015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,2,power_law_1.01,1.226534366607666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,2,power_law_1.2,1.226419162750244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,2,power_law_1.2,1.2665792465209962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,256,balanced,0.18496533234914145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,256,balanced,0.18505066633224487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,256,power_law_1.01,0.18176640272140504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,256,power_law_1.01,0.18268799781799316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,256,power_law_1.2,0.1827072024345398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,256,power_law_1.2,0.1837183952331543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,32,balanced,0.24833067258199057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,32,balanced,0.24848000208536783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,32,power_law_1.01,0.23725440502166747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,32,power_law_1.01,0.24401280879974366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,32,power_law_1.2,0.23911681175231933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,32,power_law_1.2,0.24465279579162597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,4,balanced,0.7838826974232992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,4,balanced,0.7845226923624674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,4,power_law_1.01,0.7153024196624755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,4,power_law_1.01,0.7370816230773926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,4,power_law_1.2,0.6937856197357177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,4,power_law_1.2,0.7142335891723632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,64,balanced,0.2042293349901835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,64,balanced,0.20478934049606323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,64,power_law_1.01,0.20177919864654542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,64,power_law_1.01,0.20366079807281495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,64,power_law_1.2,0.19838720560073853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,64,power_law_1.2,0.20471038818359374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,8,balanced,0.48188801606496173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,8,balanced,0.48203734556833905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,8,power_law_1.01,0.45199360847473147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,8,power_law_1.01,0.47361278533935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,8,power_law_1.2,0.4386943817138672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,1,8,power_law_1.2,0.45679359436035155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,16,1,balanced,0.3567519982655843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,16,1,balanced,0.35698668162027997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,16,1,power_law_1.01,0.3336512088775635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,16,1,power_law_1.01,0.33422720432281494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,16,1,power_law_1.2,0.33521280288696287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,16,1,power_law_1.2,0.33585920333862307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,2,1,balanced,1.3816639582316081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,2,1,balanced,1.383562723795573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,2,1,power_law_1.01,1.2224255561828614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,2,1,power_law_1.01,1.2278079986572266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,2,1,power_law_1.2,1.231494426727295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,2,1,power_law_1.2,1.231545639038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,4,1,balanced,0.4779680172602336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,4,1,balanced,0.4784586826960246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,4,1,power_law_1.01,0.4480639934539795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,4,1,power_law_1.01,0.4493247985839844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,4,1,power_law_1.2,0.4589888095855713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,4,1,power_law_1.2,0.47043838500976565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,8,1,balanced,0.30378133058547974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,8,1,balanced,0.30526934067408246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,8,1,power_law_1.01,0.2927743911743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,8,1,power_law_1.01,0.2936320066452026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,8,1,power_law_1.2,0.29377920627593995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2048,8,256,8,1,power_law_1.2,0.300435209274292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,1,balanced,2.057098706563314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,1,balanced,2.0588587125142417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,1,power_law_1.01,1.9568191528320313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,1,power_law_1.01,1.9824703216552735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,1,power_law_1.2,2.0150400161743165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,1,power_law_1.2,2.0430784225463867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,16,balanced,0.27109332879384357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,16,balanced,0.2736480037371318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,16,power_law_1.01,0.2649791955947876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,16,power_law_1.01,0.2724672079086304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,16,power_law_1.2,0.27822721004486084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,16,power_law_1.2,0.27947518825531004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,2,balanced,1.1022506554921467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,2,balanced,1.1029706796010335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,2,power_law_1.01,1.0471872329711913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,2,power_law_1.01,1.0897791862487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,2,power_law_1.2,1.1037311553955078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,2,power_law_1.2,1.1133312225341796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,32,balanced,0.20351467529932657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,32,balanced,0.204858660697937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,32,power_law_1.01,0.20633599758148194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,32,power_law_1.01,0.2066943883895874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,32,power_law_1.2,0.21841280460357665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,32,power_law_1.2,0.22121601104736327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,4,balanced,0.6252853473027548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,4,balanced,0.6263253291447958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,4,power_law_1.01,0.6063807964324951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,4,power_law_1.01,0.6138304233551025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,4,power_law_1.2,0.6215616226196289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,4,power_law_1.2,0.6529280185699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,8,balanced,0.38808000087738037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,8,balanced,0.38862399260203045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,8,power_law_1.01,0.38366720676422117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,8,power_law_1.01,0.3844095945358276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,8,power_law_1.2,0.3883392095565796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,1,8,power_law_1.2,0.3999871969223022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,2,1,balanced,1.0956426461537678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,2,1,balanced,1.0958399772644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,2,1,power_law_1.01,1.0556096076965331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,2,1,power_law_1.01,1.0651328086853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,2,1,power_law_1.2,1.0973888397216798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,2,1,power_law_1.2,1.1207039833068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,4,1,balanced,0.3768053452173869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,4,1,balanced,0.37748265266418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,4,1,power_law_1.01,0.42200322151184083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,4,1,power_law_1.01,0.42627840042114257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,4,1,power_law_1.2,0.4299007892608643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,6144,2560,8,160,4,1,power_law_1.2,0.43086719512939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,1,balanced,3.0139201482137046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,1,balanced,3.016794522603353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,1,power_law_1.01,2.564627265930176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,1,power_law_1.01,2.6714815139770507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,1,power_law_1.2,2.6210559844970702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,1,power_law_1.2,2.7289600372314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,128,balanced,0.21398399273554483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,128,balanced,0.21438399950663248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,128,power_law_1.01,0.2132416009902954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,128,power_law_1.01,0.2135103940963745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,128,power_law_1.2,0.21344640254974365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,128,power_law_1.2,0.2136064052581787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,16,balanced,0.3645333449045817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,16,balanced,0.3656959931055705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,16,power_law_1.01,0.33848960399627687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,16,power_law_1.01,0.34717440605163574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,16,power_law_1.2,0.3464832067489624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,16,power_law_1.2,0.34848001003265383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,2,balanced,1.6019360224405925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,2,balanced,1.6021706263224285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,2,power_law_1.01,1.3760191917419433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,2,power_law_1.01,1.3790656089782716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,2,power_law_1.2,1.4291775703430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,2,power_law_1.2,1.4435199737548827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,256,balanced,0.2083253264427185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,256,balanced,0.209007998307546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,256,power_law_1.01,0.2067392110824585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,256,power_law_1.01,0.2072000026702881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,256,power_law_1.2,0.20607359409332277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,256,power_law_1.2,0.20739200115203857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,32,balanced,0.27347733577092487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,32,balanced,0.2752479910850525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,32,power_law_1.01,0.2700160026550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,32,power_law_1.01,0.2737407922744751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,32,power_law_1.2,0.2702143907546997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,32,power_law_1.2,0.2716480016708374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,4,balanced,0.9002880255381266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,4,balanced,0.900714635848999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,4,power_law_1.01,0.8130368232727051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,4,power_law_1.01,0.8269760131835937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,4,power_law_1.2,0.8366144180297852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,4,power_law_1.2,0.8466815948486328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,64,balanced,0.22634132703145346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,64,balanced,0.22848532597223917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,64,power_law_1.01,0.2233344078063965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,64,power_law_1.01,0.2244352102279663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,64,power_law_1.2,0.2253567934036255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,64,power_law_1.2,0.22561280727386473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,8,balanced,0.5534826517105103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,8,balanced,0.5543520053227743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,8,power_law_1.01,0.507916784286499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,8,power_law_1.01,0.5152768135070801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,8,power_law_1.2,0.4959424018859863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,1,8,power_law_1.2,0.5390783786773682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,16,1,balanced,0.41069865226745605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,16,1,balanced,0.4116426706314087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,16,1,power_law_1.01,0.3846656084060669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,16,1,power_law_1.01,0.3846911907196045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,16,1,power_law_1.2,0.38587520122528074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,16,1,power_law_1.2,0.3874943971633911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,2,1,balanced,1.6075733502705891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,2,1,balanced,1.610047976175944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,2,1,power_law_1.01,1.3927680015563966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,2,1,power_law_1.01,1.4018048286437987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,2,1,power_law_1.2,1.4071999549865724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,2,1,power_law_1.2,1.4521984100341796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,4,1,balanced,0.5502400000890096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,4,1,balanced,0.5510559876759847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,4,1,power_law_1.01,0.5185408115386962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,4,1,power_law_1.01,0.5200704097747803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,4,1,power_law_1.2,0.5204544067382812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,4,1,power_law_1.2,0.5303872108459473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,8,1,balanced,0.34931198755900067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,8,1,balanced,0.34967998663584393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,8,1,power_law_1.01,0.33686399459838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,8,1,power_law_1.01,0.33974399566650393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,8,1,power_law_1.2,0.3369343996047974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,256,8,1,power_law_1.2,0.3418495893478394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,1,balanced,4.447253227233887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,1,balanced,4.449082692464192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,1,power_law_1.01,3.5590656280517576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,1,power_law_1.01,3.6118465423583985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,1,power_law_1.2,3.5319934844970704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,1,power_law_1.2,3.597216033935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,128,balanced,0.26708267132441205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,128,balanced,0.26799466212590534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,128,power_law_1.01,0.26496639251708987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,128,power_law_1.01,0.26499199867248535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,128,power_law_1.2,0.2630399942398071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,128,power_law_1.2,0.2673664093017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,16,balanced,0.5064853429794312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,16,balanced,0.5080480178197225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,16,power_law_1.01,0.46648321151733396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,16,power_law_1.01,0.4812096118927002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,16,power_law_1.2,0.4675327777862549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,16,power_law_1.2,0.4840703964233398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,2,balanced,2.3438186645507812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,2,balanced,2.3440906206766763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,2,power_law_1.01,1.9505855560302734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,2,power_law_1.01,1.971174430847168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,2,power_law_1.2,1.9013952255249023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,2,power_law_1.2,1.9402559280395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,32,balanced,0.37555734316507977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,32,balanced,0.37592001756032306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,32,power_law_1.01,0.3531199932098389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,32,power_law_1.01,0.3588671922683716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,32,power_law_1.2,0.343667197227478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,32,power_law_1.2,0.3591423988342285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,4,balanced,1.2971519629160564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,4,balanced,1.3017226854960124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,4,power_law_1.01,1.069919967651367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,4,power_law_1.01,1.1279680252075195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,4,power_law_1.2,1.0617600440979005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,4,power_law_1.2,1.0803647994995118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,64,balanced,0.3036746581395467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,64,balanced,0.3055093288421631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,64,power_law_1.01,0.2970240116119385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,64,power_law_1.01,0.29719679355621337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,64,power_law_1.2,0.2897279977798462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,64,power_law_1.2,0.3022592067718506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,8,balanced,0.7748586336771647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,8,balanced,0.7753173510233561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,8,power_law_1.01,0.6742208003997803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,8,power_law_1.01,0.6868991851806641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,8,power_law_1.2,0.67674880027771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,1,8,power_law_1.2,0.7048255920410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,16,1,balanced,0.33371734619140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,16,1,balanced,0.33553067843119305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,16,1,power_law_1.01,0.3006655931472778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,16,1,power_law_1.01,0.30217599868774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,16,1,power_law_1.2,0.29563519954681394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,16,1,power_law_1.2,0.2961280107498169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,2,1,balanced,2.360469341278076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,2,1,balanced,2.360736052195231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,2,1,power_law_1.01,1.9176511764526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,2,1,power_law_1.01,1.9347200393676758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,2,1,power_law_1.2,1.915123176574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,2,1,power_law_1.2,1.9440576553344726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,4,1,balanced,1.3419893582661946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,4,1,balanced,1.3420532544453938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,4,1,power_law_1.01,1.1154175758361817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,4,1,power_law_1.01,1.1264639854431153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,4,1,power_law_1.2,1.1123071670532227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,4,1,power_law_1.2,1.115833568572998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,8,1,balanced,0.4715253512064616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,8,1,balanced,0.47276798884073895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,8,1,power_law_1.01,0.4201663970947266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,8,1,power_law_1.01,0.42800002098083495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,8,1,power_law_1.2,0.418943977355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,256,7168,2048,8,384,8,1,power_law_1.2,0.4260416030883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,1,balanced,0.6788053512573242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,1,balanced,0.6794400215148926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,1,power_law_1.01,0.7571455955505371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,1,power_law_1.01,0.7576831817626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,1,power_law_1.2,0.7597439765930176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,1,power_law_1.2,0.7631999969482421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,128,balanced,0.2644266684850057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,128,balanced,0.2648800015449524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,128,power_law_1.01,0.28470399379730227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,128,power_law_1.01,0.285696005821228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,128,power_law_1.2,0.3019776105880737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,128,power_law_1.2,0.30383360385894775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,16,balanced,0.2908053398132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,16,balanced,0.2909226616223653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,16,power_law_1.01,0.3273920059204102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,16,power_law_1.01,0.329036808013916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,16,power_law_1.2,0.33911681175231934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,16,power_law_1.2,0.34875519275665284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,2,balanced,0.4960213502248128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,2,balanced,0.4977866808573405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,2,power_law_1.01,0.5422016143798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,2,power_law_1.01,0.5495039939880371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,2,power_law_1.2,0.5701119899749756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,2,power_law_1.2,0.581382417678833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,32,balanced,0.2738666733105977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,32,balanced,0.27591466903686523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,32,power_law_1.01,0.3081279993057251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,32,power_law_1.01,0.30988800525665283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,32,power_law_1.2,0.3213696002960205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,32,power_law_1.2,0.3255039930343628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,4,balanced,0.379749337832133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,4,balanced,0.38089601198832196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,4,power_law_1.01,0.4242368221282959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,4,power_law_1.01,0.436902379989624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,4,power_law_1.2,0.4340223789215088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,4,power_law_1.2,0.4417407989501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,64,balanced,0.2672746578852336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,64,balanced,0.26737600564956665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,64,power_law_1.01,0.2953536033630371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,64,power_law_1.01,0.29857919216156004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,64,power_law_1.2,0.3067967891693115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,64,power_law_1.2,0.3079744100570679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,8,balanced,0.3203466733296712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,8,balanced,0.3208266695340474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,8,power_law_1.01,0.3679231882095337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,8,power_law_1.01,0.3706559896469116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,8,power_law_1.2,0.3682559967041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,1,8,power_law_1.2,0.3780352115631104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,2,1,balanced,0.4206133286158244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,2,1,balanced,0.42110931873321533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,2,1,power_law_1.01,0.4683328151702881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,2,1,power_law_1.01,0.4694528102874756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,2,1,power_law_1.2,0.46862077713012695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,2048,768,8,128,2,1,power_law_1.2,0.46952319145202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,1,balanced,2.148805300394694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,1,balanced,2.1503626505533853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,1,power_law_1.01,2.267283248901367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,1,power_law_1.01,2.2734912872314452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,1,power_law_1.2,2.3129215240478516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,1,power_law_1.2,2.337855911254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,128,balanced,0.45049067338307697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,128,balanced,0.45158934593200684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,128,power_law_1.01,0.4884479999542236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,128,power_law_1.01,0.4948671817779541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,128,power_law_1.2,0.519385576248169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,128,power_law_1.2,0.5222015857696534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,16,balanced,0.5497066577275594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,16,balanced,0.5500266551971436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,16,power_law_1.01,0.6195519924163818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,16,power_law_1.01,0.6420479774475097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,16,power_law_1.2,0.6483967781066895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,16,power_law_1.2,0.649561595916748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,2,balanced,1.3210879961649578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,2,balanced,1.321237325668335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,2,power_law_1.01,1.4018495559692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,2,power_law_1.01,1.4026368141174317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,2,power_law_1.2,1.4460672378540038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,2,power_law_1.2,1.4512384414672852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,256,balanced,0.44489065806070965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,256,balanced,0.4456799825032552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,256,power_law_1.01,0.47535362243652346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,256,power_law_1.01,0.4758016109466553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,256,power_law_1.2,0.5054656028747558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,256,power_law_1.2,0.5080895900726319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,32,balanced,0.4923520088195801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,32,balanced,0.49505066871643066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,32,power_law_1.01,0.5556096076965332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,32,power_law_1.01,0.5592000007629394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,32,power_law_1.2,0.572870397567749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,32,power_law_1.2,0.6029439926147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,4,balanced,0.8845012982686361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,4,balanced,0.8846080303192139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,4,power_law_1.01,0.9661503791809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,4,power_law_1.01,0.9759167671203614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,4,power_law_1.2,0.9953984260559082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,4,power_law_1.2,1.0392191886901856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,64,balanced,0.4659413496653239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,64,balanced,0.4660000006357829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,64,power_law_1.01,0.510745620727539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,64,power_law_1.01,0.5204800128936767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,64,power_law_1.2,0.5364607810974121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,64,power_law_1.2,0.5429696083068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,8,balanced,0.6642239888509115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,8,balanced,0.6657013495763143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,8,power_law_1.01,0.743398380279541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,8,power_law_1.01,0.7608128070831299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,8,power_law_1.2,0.7660287857055664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,1,8,power_law_1.2,0.7966080188751221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,2,1,balanced,1.2184373537699382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,2,1,balanced,1.2202186584472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,2,1,power_law_1.01,1.2764991760253905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,2,1,power_law_1.01,1.2789183616638184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,2,1,power_law_1.2,1.308243179321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,2,1,power_law_1.2,1.3154751777648925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,4,1,balanced,0.7533653577168783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,4,1,balanced,0.7539040247599283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,4,1,power_law_1.01,0.7843200206756592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,4,1,power_law_1.01,0.786348819732666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,4,1,power_law_1.2,0.7935296058654785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,3072,1536,8,256,4,1,power_law_1.2,0.795308780670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,1,balanced,4.271701176961263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,1,balanced,4.27232011159261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,1,power_law_1.01,4.330073547363281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,1,power_law_1.01,4.380460739135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,1,power_law_1.2,4.302272033691406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,1,power_law_1.2,4.330739212036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,2,balanced,2.509226640065511
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,2,balanced,2.5133973757425943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,2,power_law_1.01,3.053126335144043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,2,power_law_1.01,3.190726470947266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,2,power_law_1.2,2.7637823104858397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,2,power_law_1.2,2.808652877807617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,4,balanced,1.5601280530293782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,4,balanced,1.561482588450114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,4,power_law_1.01,2.431007957458496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,4,power_law_1.01,2.699257659912109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,4,power_law_1.2,2.576083183288574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,4,power_law_1.2,2.736134338378906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,8,balanced,1.1454933484395344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,8,balanced,1.145690679550171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,8,power_law_1.01,2.2779903411865234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,8,power_law_1.01,2.363033676147461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,8,power_law_1.2,2.4002496719360353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,1,8,power_law_1.2,2.435750389099121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,16,1,balanced,0.3758293390274048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,16,1,balanced,0.3758506774902344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,16,1,power_law_1.01,0.3759360074996948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,16,1,power_law_1.01,0.3767935991287231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,16,1,power_law_1.2,0.36895999908447263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,16,1,power_law_1.2,0.3783616065979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,2,1,balanced,2.1705066363016763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,2,1,balanced,2.1728639602661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,2,1,power_law_1.01,2.197305679321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,2,1,power_law_1.01,2.207436752319336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,2,1,power_law_1.2,2.1975616455078124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,2,1,power_law_1.2,2.2001535415649416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,4,1,balanced,1.1459360122680664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,4,1,balanced,1.1469173431396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,4,1,power_law_1.01,1.1526592254638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,4,1,power_law_1.01,1.1643391609191895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,4,1,power_law_1.2,1.1474559783935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,4,1,power_law_1.2,1.156704044342041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,8,1,balanced,0.6304800113042196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,8,1,balanced,0.6310826539993286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,8,1,power_law_1.01,0.6336895942687988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,8,1,power_law_1.01,0.6363647937774658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,8,1,power_law_1.2,0.6253056049346923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,14336,2,8,8,1,power_law_1.2,0.6318719863891602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,1,balanced,2.1188586552937827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,1,balanced,2.119727929433187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,1,power_law_1.01,2.4200639724731445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,1,power_law_1.01,2.426265525817871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,1,power_law_1.2,2.4145408630371095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,1,power_law_1.2,2.4527231216430665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,128,balanced,0.47325332959493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,128,balanced,0.474021315574646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,128,power_law_1.01,0.5542272090911865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,128,power_law_1.01,0.5579071998596191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,128,power_law_1.2,0.611897611618042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,128,power_law_1.2,0.6248000144958497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,16,balanced,0.5679893493652344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,16,balanced,0.5696906646092733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,16,power_law_1.01,0.6703616142272949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,16,power_law_1.01,0.6899712085723877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,16,power_law_1.2,0.7229055881500244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,16,power_law_1.2,0.7675456047058106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,2,balanced,1.319386641184489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,2,balanced,1.3199520111083984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,2,power_law_1.01,1.5266431808471679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,2,power_law_1.01,1.5555071830749512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,2,power_law_1.2,1.5576383590698242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,2,power_law_1.2,1.580134391784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,32,balanced,0.514901320139567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,32,balanced,0.5151520172754923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,32,power_law_1.01,0.6198463916778565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,32,power_law_1.01,0.6268671989440918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,32,power_law_1.2,0.6880447864532471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,32,power_law_1.2,0.7400576114654541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,4,balanced,0.8924533526102701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,4,balanced,0.8944799900054932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,4,power_law_1.01,1.1341119766235352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,4,power_law_1.01,1.134598445892334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,4,power_law_1.2,1.1005439758300781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,4,power_law_1.2,1.1194815635681152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,64,balanced,0.4848266839981079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,64,balanced,0.48689599831899005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,64,power_law_1.01,0.5734528064727783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,64,power_law_1.01,0.5938111782073975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,64,power_law_1.2,0.6417535781860352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,64,power_law_1.2,0.6592832088470459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,8,balanced,0.6784533659617106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,8,balanced,0.6790560086568197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,8,power_law_1.01,0.8376895904541015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,8,power_law_1.01,0.855731201171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,8,power_law_1.2,0.8408639907836915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,1,8,power_law_1.2,0.9299200057983399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,2,1,balanced,1.1974879900614421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,2,1,balanced,1.1980693340301514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,2,1,power_law_1.01,1.3451456069946288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,2,1,power_law_1.01,1.3475263595581055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,2,1,power_law_1.2,1.3559295654296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,2,1,power_law_1.2,1.3606464385986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,4,1,balanced,0.7429599761962891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,4,1,balanced,0.7429920037587484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,4,1,power_law_1.01,0.8341952323913574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,4,1,power_law_1.01,0.8376064300537109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,4,1,power_law_1.2,0.8284671783447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,1536,8,128,4,1,power_law_1.2,0.8326335906982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,1,balanced,13.07030995686849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,1,balanced,13.075120290120443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,1,power_law_1.01,11.986259460449219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,1,power_law_1.01,12.03289566040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,1,power_law_1.2,12.157772827148438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,1,power_law_1.2,12.22208023071289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,128,balanced,1.777034600575765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,128,balanced,1.778341293334961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,128,power_law_1.01,1.9297151565551758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,128,power_law_1.01,1.9624128341674805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,128,power_law_1.2,2.035788726806641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,128,power_law_1.2,2.038547134399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,16,balanced,2.4144800504048667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,16,balanced,2.418288071950277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,16,power_law_1.01,2.569523239135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,16,power_law_1.01,2.6159360885620115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,16,power_law_1.2,2.701356887817383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,16,power_law_1.2,2.8613056182861327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,2,balanced,7.454501469930013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,2,balanced,7.455088297526042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,2,power_law_1.01,7.152812957763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,2,power_law_1.01,7.183942413330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,2,power_law_1.2,7.213337707519531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,2,power_law_1.2,7.294649505615235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,256,balanced,1.7310560544331868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,256,balanced,1.7369492848714192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,256,power_law_1.01,1.8760383605957032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,256,power_law_1.01,1.880678367614746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,256,power_law_1.2,1.9600128173828124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,256,power_law_1.2,1.9856639862060548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,32,balanced,2.0520426432291665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,32,balanced,2.0538454055786133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,32,power_law_1.01,2.237459182739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,32,power_law_1.01,2.2683008193969725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,32,power_law_1.2,2.3206975936889647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,32,power_law_1.2,2.4030080795288087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,4,balanced,4.578799883524577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,4,balanced,4.580277442932129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,4,power_law_1.01,4.595833587646484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,4,power_law_1.01,4.632812881469727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,4,power_law_1.2,4.581644821166992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,4,power_law_1.2,4.820806503295898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,64,balanced,1.8668640454610188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,64,balanced,1.8748373985290527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,64,power_law_1.01,2.040140724182129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,64,power_law_1.01,2.0542144775390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,64,power_law_1.2,2.1514047622680663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,64,power_law_1.2,2.178771209716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,8,balanced,3.141167958577474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,8,balanced,3.147674560546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,8,power_law_1.01,3.222137451171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,8,power_law_1.01,3.260569763183594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,8,power_law_1.2,3.3948223114013674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,4096,2688,22,512,1,8,power_law_1.2,3.476601409912109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,1,balanced,6.842671712239583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,1,balanced,6.842682520548503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,1,power_law_1.01,7.008000183105469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,1,power_law_1.01,7.05389404296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,1,power_law_1.2,7.028594970703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,1,power_law_1.2,7.036390686035157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,2,balanced,3.8058932622273765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,2,balanced,3.8066027959187827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,2,power_law_1.01,4.5773567199707035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,2,power_law_1.01,4.628716659545899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,2,power_law_1.2,4.537286376953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,2,power_law_1.2,4.716460800170898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,4,balanced,2.249231974283854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,4,balanced,2.2509973843892417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,4,power_law_1.01,3.7167423248291014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,4,power_law_1.01,3.875539016723633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,4,power_law_1.2,3.861420822143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,4,power_law_1.2,3.91976318359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,8,balanced,1.4938027064005535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,8,balanced,1.4947412808736165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,8,power_law_1.01,3.1649023056030274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,8,power_law_1.01,3.4046142578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,8,power_law_1.2,3.672415924072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,1,8,power_law_1.2,3.6832958221435548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,16,1,balanced,0.5951360066731771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,16,1,balanced,0.5962346792221069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,16,1,power_law_1.01,0.5860288143157959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,16,1,power_law_1.01,0.5969535827636718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,16,1,power_law_1.2,0.5847616195678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,16,1,power_law_1.2,0.5932928085327148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,2,1,balanced,3.478351910909017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,2,1,balanced,3.4837706883748374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,2,1,power_law_1.01,3.5194942474365236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,2,1,power_law_1.01,3.5496063232421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,2,1,power_law_1.2,3.5358081817626954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,2,1,power_law_1.2,3.5432769775390627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,32,1,balanced,0.3781919876734416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,32,1,balanced,0.37885868549346924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,32,1,power_law_1.01,0.37750399112701416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,32,1,power_law_1.01,0.37912960052490235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,32,1,power_law_1.2,0.38080639839172364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,32,1,power_law_1.2,0.38188159465789795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,4,1,balanced,1.8160053888956706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,4,1,balanced,1.8184107144673665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,4,1,power_law_1.01,1.8430591583251954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,4,1,power_law_1.01,1.8661632537841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,4,1,power_law_1.2,1.8443071365356445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,4,1,power_law_1.2,1.84783992767334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,8,1,balanced,1.0058506329854329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,8,1,balanced,1.0072480042775471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,8,1,power_law_1.01,1.0028863906860352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,8,1,power_law_1.01,1.009670352935791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,8,1,power_law_1.2,1.0048831939697265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,16384,2,8,8,1,power_law_1.2,1.009171199798584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,1,balanced,5.121151924133301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,1,balanced,5.121775945027669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,1,power_law_1.01,5.4163776397705075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,1,power_law_1.01,5.438316726684571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,1,power_law_1.2,5.551302337646485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,1,power_law_1.2,5.583808135986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,128,balanced,0.7146346569061279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,128,balanced,0.7159146467844645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,128,power_law_1.01,0.8279168128967285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,128,power_law_1.01,0.8297920227050781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,128,power_law_1.2,0.8710080146789551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,128,power_law_1.2,0.8843903541564941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,16,balanced,0.9665226936340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,16,balanced,0.9721972942352295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,16,power_law_1.01,1.1499263763427734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,16,power_law_1.01,1.1508864402770995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,16,power_law_1.2,1.2063039779663085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,16,power_law_1.2,1.2119423866271972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,2,balanced,2.944239934285482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,2,balanced,2.946000099182129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,2,power_law_1.01,3.16748161315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,2,power_law_1.01,3.244345474243164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,2,power_law_1.2,3.346380615234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,2,power_law_1.2,3.3528446197509765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,256,balanced,0.6990400155385336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,256,balanced,0.6994240283966064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,256,power_law_1.01,0.7784575939178466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,256,power_law_1.01,0.7822080135345459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,256,power_law_1.2,0.8577471733093261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,256,power_law_1.2,0.8675519943237304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,32,balanced,0.8235200246175131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,32,balanced,0.8238613605499268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,32,power_law_1.01,0.9695232391357422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,32,power_law_1.01,1.0066944122314454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,32,power_law_1.2,1.0329471588134767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,32,power_law_1.2,1.0421055793762206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,4,balanced,1.8185173670450847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,4,balanced,1.8206720352172852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,4,power_law_1.01,2.058745574951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,4,power_law_1.01,2.0659584045410155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,4,power_law_1.2,2.173420715332031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,4,power_law_1.2,2.1985919952392576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,64,balanced,0.7521066665649414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,64,balanced,0.7526240348815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,64,power_law_1.01,0.861945629119873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,64,power_law_1.01,0.8675840377807618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,64,power_law_1.2,0.9614080429077149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,64,power_law_1.2,1.0068415641784667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,8,balanced,1.2223893006642659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,8,balanced,1.225648005803426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,8,power_law_1.01,1.4346752166748047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,8,power_law_1.01,1.4422592163085937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,8,power_law_1.2,1.560582447052002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,1,8,power_law_1.2,1.5631039619445801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,16,1,balanced,0.831712007522583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,16,1,balanced,0.8328320185343424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,16,1,power_law_1.01,0.849830436706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,16,1,power_law_1.01,0.8520575523376465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,16,1,power_law_1.2,0.8571840286254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,16,1,power_law_1.2,0.8606207847595215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,2,1,balanced,2.795546531677246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,2,1,balanced,2.7963892618815103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,2,1,power_law_1.01,2.9646591186523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,2,1,power_law_1.01,2.967424011230469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,2,1,power_law_1.2,3.021855926513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,2,1,power_law_1.2,3.0428543090820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,4,1,balanced,1.6189173062642415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,4,1,balanced,1.6197867393493652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,4,1,power_law_1.01,1.7013631820678712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,4,1,power_law_1.01,1.706150436401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,4,1,power_law_1.2,1.7281984329223632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,4,1,power_law_1.2,1.7367616653442384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,8,1,balanced,1.8050506909688313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,8,1,balanced,1.807439963022868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,8,1,power_law_1.01,2.0373760223388673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,8,1,power_law_1.01,2.0416000366210936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,8,1,power_law_1.2,2.043903923034668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2048,8,256,8,1,power_law_1.2,2.0615871429443358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,1,balanced,5.7742665608723955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,1,balanced,5.781781514485677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,1,power_law_1.01,5.8085182189941404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,1,power_law_1.01,5.814969635009765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,1,power_law_1.2,5.8531646728515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,1,power_law_1.2,5.902668762207031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,16,balanced,1.0474507013956706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,16,balanced,1.0502346356709797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,16,power_law_1.01,1.3044095993041993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,16,power_law_1.01,1.3646592140197753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,16,power_law_1.2,1.3940671920776366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,16,power_law_1.2,1.4551615715026855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,2,balanced,3.294794718424479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,2,balanced,3.295898755391439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,2,power_law_1.01,3.4635711669921876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,2,power_law_1.01,3.525126266479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,2,power_law_1.2,3.512684631347656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,2,power_law_1.2,3.5949825286865233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,32,balanced,0.8790079752604166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,32,balanced,0.8812212944030762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,32,power_law_1.01,1.0844608306884767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,32,power_law_1.01,1.0962495803833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,32,power_law_1.2,1.195251178741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,32,power_law_1.2,1.2728960037231445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,4,balanced,1.9880852699279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,4,balanced,1.9891039530436199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,4,power_law_1.01,2.218886375427246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,4,power_law_1.01,2.260588836669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,4,power_law_1.2,2.260537528991699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,4,power_law_1.2,2.295315170288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,8,balanced,1.3522027333577473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,8,balanced,1.3527679443359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,8,power_law_1.01,1.564908790588379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,8,power_law_1.01,1.6574720382690429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,8,power_law_1.2,1.694086456298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,1,8,power_law_1.2,1.714841651916504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,2,1,balanced,3.1375252405802407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,2,1,balanced,3.1399412155151367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,2,1,power_law_1.01,3.1473535537719726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,2,1,power_law_1.01,3.158995246887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,2,1,power_law_1.2,3.174284744262695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,2,1,power_law_1.2,3.1836671829223633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,4,1,balanced,1.7784053484598796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,4,1,balanced,1.7793973286946614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,4,1,power_law_1.01,1.7710016250610352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,4,1,power_law_1.01,1.7766399383544922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,4,1,power_law_1.2,1.7794559478759766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,6144,2560,8,160,4,1,power_law_1.2,1.7929855346679688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,1,balanced,5.912570953369141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,1,balanced,5.915653228759766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,1,power_law_1.01,6.227308654785157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,1,power_law_1.01,6.251424026489258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,1,power_law_1.2,6.4170684814453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,1,power_law_1.2,6.434905242919922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,128,balanced,0.7740320364634196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,128,balanced,0.7749866644541422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,128,power_law_1.01,0.8871616363525391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,128,power_law_1.01,0.9072640419006348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,128,power_law_1.2,0.9736000061035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,128,power_law_1.2,0.9929856300354004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,16,balanced,1.07258137067159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,16,balanced,1.0729066530863445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,16,power_law_1.01,1.2613951683044433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,16,power_law_1.01,1.3149439811706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,16,power_law_1.2,1.3892736434936523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,16,power_law_1.2,1.4097536087036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,2,balanced,3.3780320485432944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,2,balanced,3.3797601064046225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,2,power_law_1.01,3.703859329223633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,2,power_law_1.01,3.7089984893798826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,2,power_law_1.2,3.869388961791992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,2,power_law_1.2,3.9050113677978517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,256,balanced,0.7558240095774332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,256,balanced,0.7565493583679199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,256,power_law_1.01,0.8477824211120606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,256,power_law_1.01,0.8504063606262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,256,power_law_1.2,0.928831958770752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,256,power_law_1.2,0.972646427154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,32,balanced,0.9036213556925455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,32,balanced,0.904917319615682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,32,power_law_1.01,1.0736127853393556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,32,power_law_1.01,1.095468807220459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,32,power_law_1.2,1.1689663887023927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,32,power_law_1.2,1.1990912437438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,4,balanced,2.0643946329752603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,4,balanced,2.06550931930542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,4,power_law_1.01,2.339603233337402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,4,power_law_1.01,2.369260787963867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,4,power_law_1.2,2.5315519332885743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,4,power_law_1.2,2.5372480392456054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,64,balanced,0.8174826304117838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,64,balanced,0.8212746779123942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,64,power_law_1.01,0.9469056129455566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,64,power_law_1.01,0.9806719779968261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,64,power_law_1.2,1.0093759536743163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,64,power_law_1.2,1.0454719543457032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,8,balanced,1.3643892606099446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,8,balanced,1.3665332794189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,8,power_law_1.01,1.5529088020324706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,8,power_law_1.01,1.6264703750610352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,8,power_law_1.2,1.7205631256103515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,1,8,power_law_1.2,1.728531265258789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,16,1,balanced,0.960746685663859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,16,1,balanced,0.9625493685404459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,16,1,power_law_1.01,0.9793600082397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,16,1,power_law_1.01,0.9806655883789063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,16,1,power_law_1.2,0.9935935974121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,16,1,power_law_1.2,0.9951295852661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,2,1,balanced,3.2313547134399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,2,1,balanced,3.2345546086629233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,2,1,power_law_1.01,3.421984100341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,2,1,power_law_1.01,3.4361087799072267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,2,1,power_law_1.2,3.4897537231445312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,2,1,power_law_1.2,3.531302261352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,4,1,balanced,1.870240052541097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,4,1,balanced,1.872037410736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,4,1,power_law_1.01,1.9539648056030274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,4,1,power_law_1.01,1.9710399627685546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,4,1,power_law_1.2,2.003059196472168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,4,1,power_law_1.2,2.0047807693481445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,8,1,balanced,2.095285256703695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,8,1,balanced,2.0972906748453775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,8,1,power_law_1.01,2.366815948486328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,8,1,power_law_1.01,2.3695232391357424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,8,1,power_law_1.2,2.3785919189453124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,256,8,1,power_law_1.2,2.380179214477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,1,balanced,5.163690567016602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,1,balanced,5.167189280192058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,1,power_law_1.01,7.189740753173828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,1,power_law_1.01,7.233523559570313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,1,power_law_1.2,7.5393730163574215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,1,power_law_1.2,7.541260528564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,128,balanced,0.8201546669006348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,128,balanced,0.8219626744588217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,128,power_law_1.01,0.9336511611938476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,128,power_law_1.01,0.954860782623291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,128,power_law_1.2,0.9791359901428223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,128,power_law_1.2,0.9874688148498535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,16,balanced,1.0724426905314128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,16,balanced,1.0746506849924724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,16,power_law_1.01,1.3508543968200684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,16,power_law_1.01,1.3807552337646485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,16,power_law_1.2,1.406835174560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,16,power_law_1.2,1.412889575958252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,2,balanced,3.0412267049153647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,2,balanced,3.043285369873047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,2,power_law_1.01,4.161139297485351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,2,power_law_1.01,4.181990432739258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,2,power_law_1.2,4.367647933959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,2,power_law_1.2,4.384595108032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,32,balanced,0.9327253500620524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,32,balanced,0.9338239828745524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,32,power_law_1.01,1.1170944213867187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,32,power_law_1.01,1.1328384399414062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,32,power_law_1.2,1.1916864395141602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,32,power_law_1.2,1.1960639953613281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,4,balanced,1.9237866401672363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,4,balanced,1.9278826713562012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,4,power_law_1.01,2.592140769958496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,4,power_law_1.01,2.658316802978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,4,power_law_1.2,2.7036159515380858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,4,power_law_1.2,2.8554880142211916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,64,balanced,0.8558666706085205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,64,balanced,0.8572746912638346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,64,power_law_1.01,1.0126591682434083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,64,power_law_1.01,1.0375231742858886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,64,power_law_1.2,1.0559103965759278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,64,power_law_1.2,1.1069055557250977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,8,balanced,1.3628427187601726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,8,balanced,1.3636852900187175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,8,power_law_1.01,1.8121919631958008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,8,power_law_1.01,1.814873504638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,8,power_law_1.2,1.8406143188476562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,1,8,power_law_1.2,1.8604608535766602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,16,1,balanced,0.8973546822865804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,16,1,balanced,0.8993919690450033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,16,1,power_law_1.01,1.1262911796569823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,16,1,power_law_1.01,1.129535961151123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,16,1,power_law_1.2,1.1473728179931642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,16,1,power_law_1.2,1.1583680152893066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,2,1,balanced,2.839445432027181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,2,1,balanced,2.8437067667643228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,2,1,power_law_1.01,3.9227264404296873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,2,1,power_law_1.01,3.948896026611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,2,1,power_law_1.2,4.0661567687988285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,2,1,power_law_1.2,4.125305557250977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,4,1,balanced,1.721882661183675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,4,1,balanced,1.7235840161641438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,4,1,power_law_1.01,2.2739519119262694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,4,1,power_law_1.01,2.3060543060302736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,4,1,power_law_1.2,2.366022491455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,4,1,power_law_1.2,2.388057518005371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,8,1,balanced,1.1736586888631184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,8,1,balanced,1.1766080061594646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,8,1,power_law_1.01,1.4891903877258301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,8,1,power_law_1.01,1.4899583816528321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,8,1,power_law_1.2,1.546560001373291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,3072,7168,2048,8,384,8,1,power_law_1.2,1.5477631568908692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,1,balanced,0.14840533336003622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,1,balanced,0.14890133341153464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,1,power_law_1.01,0.12713600397109986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,1,power_law_1.01,0.12828160524368287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,1,power_law_1.2,0.1266111969947815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,1,power_law_1.2,0.12737280130386353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,128,balanced,0.03965866565704346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,128,balanced,0.03979733337958654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,128,power_law_1.01,0.03760640025138855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,128,power_law_1.01,0.037676799297332766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,128,power_law_1.2,0.03761279881000519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,128,power_law_1.2,0.03765760064125061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,16,balanced,0.04254400233427683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,16,balanced,0.04365866879622141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,16,power_law_1.01,0.04147840142250061
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,16,power_law_1.01,0.04191359877586365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,16,power_law_1.2,0.04016000032424927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,16,power_law_1.2,0.04044800102710724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,2,balanced,0.09557333588600159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,2,balanced,0.09597333272298177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,2,power_law_1.01,0.08601599931716919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,2,power_law_1.01,0.08760319948196411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,2,power_law_1.2,0.08361600041389465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,2,power_law_1.2,0.08891519904136658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,32,balanced,0.0394400010506312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,32,balanced,0.03990400085846583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,32,power_law_1.01,0.03795199990272522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,32,power_law_1.01,0.03806720077991486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,32,power_law_1.2,0.03811199963092804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,32,power_law_1.2,0.03813120126724243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,4,balanced,0.0650079995393753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,4,balanced,0.06614399949709575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,4,power_law_1.01,0.06130560040473938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,4,power_law_1.01,0.061817598342895505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,4,power_law_1.2,0.0605184018611908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,4,power_law_1.2,0.06120960116386413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,64,balanced,0.039488000174363456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,64,balanced,0.03973866750796636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,64,power_law_1.01,0.03763200044631958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,64,power_law_1.01,0.03776000142097473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,64,power_law_1.2,0.03772160112857818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,64,power_law_1.2,0.03814400136470795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,8,balanced,0.05572799841562907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,8,balanced,0.05601066847642263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,8,power_law_1.01,0.04990079998970032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,8,power_law_1.01,0.05196160078048706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,8,power_law_1.2,0.05065600275993347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,1,8,power_law_1.2,0.05144320130348205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,2,1,balanced,0.0969599982102712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,2,1,balanced,0.09843732913335164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,2,1,power_law_1.01,0.08829439878463745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,2,1,power_law_1.01,0.08855040073394775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,2,1,power_law_1.2,0.08828160166740417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,2048,768,8,128,2,1,power_law_1.2,0.08862720131874084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,1,balanced,0.6151626507441202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,1,balanced,0.6152533292770386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,1,power_law_1.01,0.3383296012878418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,1,power_law_1.01,0.346777606010437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,1,power_law_1.2,0.30703999996185305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,1,power_law_1.2,0.3142591953277588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,128,balanced,0.05118933320045471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,128,balanced,0.052154665191968284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,128,power_law_1.01,0.05126399993896484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,128,power_law_1.01,0.052179199457168576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,128,power_law_1.2,0.05121279954910278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,128,power_law_1.2,0.05203840136528015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,16,balanced,0.07901333272457123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,16,balanced,0.07945066690444946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,16,power_law_1.01,0.07511680126190186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,16,power_law_1.01,0.07700480222702026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,16,power_law_1.2,0.07415680289268493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,16,power_law_1.2,0.07496320009231568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,2,balanced,0.338645339012146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,2,balanced,0.34354666868845624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,2,power_law_1.01,0.20817921161651612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,2,power_law_1.01,0.20999679565429688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,2,power_law_1.2,0.19263999462127684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,2,power_law_1.2,0.20499839782714843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,256,balanced,0.04985600213209788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,256,balanced,0.05106666684150696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,256,power_law_1.01,0.0474047988653183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,256,power_law_1.01,0.04872959852218628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,256,power_law_1.2,0.047775998711586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,256,power_law_1.2,0.050329601764678954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,32,balanced,0.07047999898592631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,32,balanced,0.07158400118350983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,32,power_law_1.01,0.06255999803543091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,32,power_law_1.01,0.06505600214004517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,32,power_law_1.2,0.06245120167732239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,32,power_law_1.2,0.06547200083732604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,4,balanced,0.19264533122380575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,4,balanced,0.1942453384399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,4,power_law_1.01,0.1449087977409363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,4,power_law_1.01,0.1462656021118164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,4,power_law_1.2,0.13596800565719605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,4,power_law_1.2,0.1498304009437561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,64,balanced,0.056159997979799904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,64,balanced,0.057775999108950295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,64,power_law_1.01,0.054073601961135864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,64,power_law_1.01,0.05578879714012146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,64,power_law_1.2,0.053427201509475705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,64,power_law_1.2,0.053990399837493895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,8,balanced,0.12679466605186462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,8,balanced,0.1300159990787506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,8,power_law_1.01,0.11509120464324951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,8,power_law_1.2,0.09737600088119507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,1,8,power_law_1.2,0.10784640312194824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,2,1,balanced,0.33429865042368573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,2,1,balanced,0.3349226713180542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,2,1,power_law_1.01,0.18831360340118408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,2,1,power_law_1.01,0.19482879638671874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,2,1,power_law_1.2,0.1821887969970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,2,1,power_law_1.2,0.18532480001449586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,4,1,balanced,0.20307733615239462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,4,1,balanced,0.2031573255856832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,4,1,power_law_1.01,0.13008639812469483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,4,1,power_law_1.01,0.1319615960121155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,4,1,power_law_1.2,0.12212480306625366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,3072,1536,8,256,4,1,power_law_1.2,0.1224511981010437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,1,balanced,0.29973334074020386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,1,balanced,0.3045919934908549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,1,power_law_1.01,0.2999039888381958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,1,power_law_1.01,0.30167040824890134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,1,power_law_1.2,0.2966399908065796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,1,power_law_1.2,0.29989120960235593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,2,balanced,0.22004266579945883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,2,balanced,0.22954134146372476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,2,power_law_1.01,0.21235198974609376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,2,power_law_1.01,0.2128511905670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,2,power_law_1.2,0.21227519512176513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,2,power_law_1.2,0.21311359405517577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,4,balanced,0.1684160033861796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,4,balanced,0.17031466960906982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,4,power_law_1.01,0.1816831946372986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,4,power_law_1.01,0.1866368055343628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,4,power_law_1.2,0.1881343960762024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,4,power_law_1.2,0.1897536039352417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,8,balanced,0.16224533319473267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,8,balanced,0.1629813313484192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,8,power_law_1.01,0.16242560148239135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,8,power_law_1.01,0.16316159963607788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,8,power_law_1.2,0.16313600540161133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,1,8,power_law_1.2,0.16344319581985473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,16,1,balanced,0.05552533268928528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,16,1,balanced,0.05607999861240387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,16,1,power_law_1.01,0.051712000370025636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,16,1,power_law_1.01,0.05196160078048706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,16,1,power_law_1.2,0.05354239940643311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,16,1,power_law_1.2,0.055430400371551516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,2,1,balanced,0.16737600167592367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,2,1,balanced,0.16810667514801025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,2,1,power_law_1.01,0.16049280166625976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,2,1,power_law_1.01,0.16179200410842895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,2,1,power_law_1.2,0.16330879926681519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,2,1,power_law_1.2,0.16343040466308595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,4,1,balanced,0.09698667128880818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,4,1,balanced,0.10261866450309753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,4,1,power_law_1.01,0.0942143976688385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,4,1,power_law_1.01,0.09472640156745911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,4,1,power_law_1.2,0.0941760003566742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,4,1,power_law_1.2,0.09422720074653626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,8,1,balanced,0.0702453354994456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,8,1,balanced,0.07026666899522145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,8,1,power_law_1.01,0.06800640225410462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,8,1,power_law_1.01,0.06967039704322815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,8,1,power_law_1.2,0.0692736029624939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,14336,2,8,8,1,power_law_1.2,0.06928640007972717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,1,balanced,0.42712001005808514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,1,balanced,0.4299413363138835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,1,power_law_1.01,0.3695103883743286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,1,power_law_1.01,0.37703039646148684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,1,power_law_1.2,0.3678143978118896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,1,power_law_1.2,0.37662079334259035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,128,balanced,0.05400000015894572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,128,balanced,0.0543093333641688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,128,power_law_1.01,0.05416319966316223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,128,power_law_1.01,0.05512319803237915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,128,power_law_1.2,0.05443840026855469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,128,power_law_1.2,0.054995197057724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,16,balanced,0.07841066519419353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,16,balanced,0.0823520024617513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,16,power_law_1.01,0.07779840230941773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,16,power_law_1.01,0.07809919714927674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,16,power_law_1.2,0.07603840231895446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,16,power_law_1.2,0.07749760150909424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,2,balanced,0.24210667610168457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,2,balanced,0.2447999914487203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,2,power_law_1.01,0.21716480255126952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,2,power_law_1.01,0.21916799545288085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,2,power_law_1.2,0.21583359241485595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,2,power_law_1.2,0.22041599750518798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,32,balanced,0.06555733581384023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,32,balanced,0.06704533100128174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,32,power_law_1.01,0.0615231990814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,32,power_law_1.01,0.06220160126686096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,32,power_law_1.2,0.06332799792289734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,32,power_law_1.2,0.06680319905281067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,4,balanced,0.15100266536076865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,4,balanced,0.15543466806411743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,4,power_law_1.01,0.13464959859848022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,4,power_law_1.01,0.14421759843826293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,4,power_law_1.2,0.1402176022529602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,4,power_law_1.2,0.14291839599609374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,64,balanced,0.05776533484458923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,64,balanced,0.059605335195859276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,64,power_law_1.01,0.05635200142860412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,64,power_law_1.01,0.05864319801330566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,64,power_law_1.2,0.05621119737625122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,64,power_law_1.2,0.05822719931602478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,8,balanced,0.09135466814041138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,8,balanced,0.0922826627890269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,8,power_law_1.01,0.0880895972251892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,8,power_law_1.01,0.08925439715385437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,8,power_law_1.2,0.08647040128707886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,1,8,power_law_1.2,0.08849920034408569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,2,1,balanced,0.24944533904393515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,2,1,balanced,0.2500159939130147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,2,1,power_law_1.01,0.2126847982406616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,2,1,power_law_1.01,0.2147200107574463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,2,1,power_law_1.2,0.2141887903213501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,2,1,power_law_1.2,0.21666560173034669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,4,1,balanced,0.15755200386047363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,4,1,balanced,0.15953600406646729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,4,1,power_law_1.01,0.14238719940185546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,4,1,power_law_1.01,0.14529279470443726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,4,1,power_law_1.2,0.1450111985206604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,1536,8,128,4,1,power_law_1.2,0.14526079893112182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,1,balanced,2.6931838989257812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,1,balanced,2.693434715270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,1,power_law_1.01,2.000172805786133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,1,power_law_1.01,2.0193855285644533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,1,power_law_1.2,1.9767999649047852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,1,power_law_1.2,1.989593505859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,128,balanced,0.09065600236256917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,128,balanced,0.09289066990216573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,128,power_law_1.01,0.09145600199699402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,128,power_law_1.01,0.09200639724731445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,128,power_law_1.2,0.08948479890823365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,128,power_law_1.2,0.09223039746284485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,16,balanced,0.23637332518895468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,16,balanced,0.23826134204864502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,16,power_law_1.01,0.22802560329437255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,16,power_law_1.01,0.23092479705810548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,16,power_law_1.2,0.21304960250854493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,16,power_law_1.2,0.2257920026779175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,2,balanced,1.3814613024393718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,2,balanced,1.382815996805827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,2,power_law_1.01,1.083353614807129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,2,power_law_1.01,1.1035327911376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,2,power_law_1.2,1.0807488441467286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,2,power_law_1.2,1.115443229675293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,256,balanced,0.07893333335717519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,256,balanced,0.08347733815511067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,256,power_law_1.01,0.07932800054550171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,256,power_law_1.01,0.07946239709854126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,256,power_law_1.2,0.08060799837112427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,256,power_law_1.2,0.08161919713020324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,32,balanced,0.1553546686967214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,32,balanced,0.15782933433850607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,32,power_law_1.01,0.1380735993385315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,32,power_law_1.01,0.13998080492019654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,32,power_law_1.2,0.14265600442886353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,32,power_law_1.2,0.143014395236969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,4,balanced,0.7277599970499674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,4,balanced,0.7303413550059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,4,power_law_1.01,0.6360511779785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,4,power_law_1.01,0.658841609954834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,4,power_law_1.2,0.6461440086364746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,4,power_law_1.2,0.6470143795013428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,64,balanced,0.10365333159764607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,64,balanced,0.10408000151316325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,64,power_law_1.01,0.10109440088272095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,64,power_law_1.01,0.102566397190094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,64,power_law_1.2,0.10115840435028076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,64,power_law_1.2,0.10236159563064576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,8,balanced,0.39819733301798504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,8,balanced,0.3982880115509033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,8,power_law_1.01,0.3545664072036743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,8,power_law_1.01,0.3971967935562134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,8,power_law_1.2,0.3350719928741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,4096,2688,22,512,1,8,power_law_1.2,0.36824960708618165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,1,balanced,0.4569600025812785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,1,balanced,0.45899200439453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,1,power_law_1.01,0.4559040069580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,1,power_law_1.01,0.45795841217041017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,1,power_law_1.2,0.45011200904846194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,1,power_law_1.2,0.45413761138916015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,2,balanced,0.2916640043258667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,2,balanced,0.3292959928512573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,2,power_law_1.01,0.3174911975860596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,2,power_law_1.01,0.3198015928268433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,2,power_law_1.2,0.31310720443725587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,2,power_law_1.2,0.31994879245758057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,4,balanced,0.19847466548283896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,4,balanced,0.19924267133076987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,4,power_law_1.01,0.22357120513916015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,4,power_law_1.01,0.22942719459533692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,4,power_law_1.2,0.22048640251159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,4,power_law_1.2,0.22079999446868898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,8,balanced,0.17735467354456583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,8,balanced,0.17907732725143433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,8,power_law_1.01,0.17847039699554443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,8,power_law_1.01,0.1793727993965149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,8,power_law_1.2,0.17904000282287597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,1,8,power_law_1.2,0.1827455997467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,16,1,balanced,0.07240533332029979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,16,1,balanced,0.07328533132870992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,16,1,power_law_1.01,0.07112320065498352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,16,1,power_law_1.01,0.07120000123977661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,16,1,power_law_1.2,0.0713599979877472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,16,1,power_law_1.2,0.07171840071678162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,2,1,balanced,0.24324800570805868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,2,1,balanced,0.24567999442418417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,2,1,power_law_1.01,0.24961280822753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,2,1,power_law_1.01,0.25136001110076905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,2,1,power_law_1.2,0.23963520526885987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,2,1,power_law_1.2,0.24673919677734374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,32,1,balanced,0.05808533231417338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,32,1,balanced,0.059877331058184304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,32,1,power_law_1.01,0.05569919943809509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,32,1,power_law_1.01,0.05767040252685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,32,1,power_law_1.2,0.05737599730491638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,32,1,power_law_1.2,0.057555198669433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,4,1,balanced,0.13770133256912231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,4,1,balanced,0.17335999011993408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,4,1,power_law_1.01,0.1349184036254883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,4,1,power_law_1.01,0.14180480241775512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,4,1,power_law_1.2,0.13882240056991577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,4,1,power_law_1.2,0.14488960504531861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,8,1,balanced,0.09259200096130371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,8,1,balanced,0.09731733798980713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,8,1,power_law_1.01,0.09234560132026673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,8,1,power_law_1.01,0.09466239809989929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,8,1,power_law_1.2,0.09225599765777588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,16384,2,8,8,1,power_law_1.2,0.0923520028591156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,1,balanced,1.5595146814982097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,1,balanced,1.5633333524068196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,1,power_law_1.01,0.8229056358337402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,1,power_law_1.01,0.8245120048522949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,1,power_law_1.2,0.740012788772583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,1,power_law_1.2,0.7619647979736328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,128,balanced,0.07843199868996938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,128,balanced,0.08141333361466725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,128,power_law_1.01,0.07662720084190369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,128,power_law_1.01,0.07861120104789734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,128,power_law_1.2,0.07575039863586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,128,power_law_1.2,0.07622399926185608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,16,balanced,0.14792533715566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,16,balanced,0.1507306694984436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,16,power_law_1.01,0.1270143985748291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,16,power_law_1.01,0.13033599853515626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,16,power_law_1.2,0.1196671962738037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,16,power_law_1.2,0.13515520095825195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,2,balanced,0.8105013370513916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,2,balanced,0.8108906745910645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,2,power_law_1.01,0.4586495876312256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,2,power_law_1.01,0.46830081939697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,2,power_law_1.2,0.43912320137023925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,2,power_law_1.2,0.46556801795959474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,256,balanced,0.07031466563542683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,256,balanced,0.07060266534487407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,256,power_law_1.01,0.066457599401474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,256,power_law_1.01,0.0692351996898651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,256,power_law_1.2,0.06816639900207519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,256,power_law_1.2,0.07120000123977661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,32,balanced,0.10762666662534077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,32,balanced,0.10935466488202412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,32,power_law_1.01,0.09955840110778809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,32,power_law_1.01,0.1028223991394043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,32,power_law_1.2,0.09662719964981079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,32,power_law_1.2,0.10042239427566528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,4,balanced,0.44391465187072754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,4,balanced,0.44512001673380536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,4,power_law_1.01,0.28431999683380127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,4,power_law_1.01,0.3153791904449463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,4,power_law_1.2,0.2876032114028931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,4,power_law_1.2,0.2901376008987427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,64,balanced,0.09150399764378865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,64,balanced,0.09155199925104777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,64,power_law_1.01,0.09094399809837342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,64,power_law_1.01,0.09096959829330445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,64,power_law_1.2,0.08831999897956848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,64,power_law_1.2,0.08888319730758668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,8,balanced,0.24337067206700644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,8,balanced,0.24361600478490195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,8,power_law_1.01,0.23590400218963622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,8,power_law_1.01,0.23946878910064698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,8,power_law_1.2,0.15883519649505615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,1,8,power_law_1.2,0.23303680419921874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,16,1,balanced,0.18082133928934732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,16,1,balanced,0.18238933881123862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,16,1,power_law_1.01,0.11829760074615478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,16,1,power_law_1.01,0.11860480308532714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,16,1,power_law_1.2,0.11388159990310669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,16,1,power_law_1.2,0.11404160261154175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,2,1,balanced,0.8015626271565756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,2,1,balanced,0.8037280241648356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,2,1,power_law_1.01,0.43601279258728026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,2,1,power_law_1.01,0.4500095844268799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,2,1,power_law_1.2,0.4034304141998291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,2,1,power_law_1.2,0.41899518966674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,4,1,balanced,0.4522240161895752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,4,1,balanced,0.455077330271403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,4,1,power_law_1.01,0.24488320350646972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,4,1,power_law_1.01,0.2465343952178955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,4,1,power_law_1.2,0.23303680419921874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,4,1,power_law_1.2,0.23698561191558837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,8,1,balanced,0.30429333448410034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,8,1,balanced,0.31031999985376996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,8,1,power_law_1.01,0.1671231985092163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,8,1,power_law_1.01,0.16833920478820802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,8,1,power_law_1.2,0.15237760543823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2048,8,256,8,1,power_law_1.2,0.16151039600372313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,1,balanced,1.2347839673360188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,1,balanced,1.2411573727925618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,1,power_law_1.01,0.957363224029541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,1,power_law_1.01,0.9745599746704101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,1,power_law_1.2,0.9697343826293945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,1,power_law_1.2,0.971225643157959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,16,balanced,0.12430933117866516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,16,balanced,0.12550933162371317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,16,power_law_1.01,0.11461759805679321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,16,power_law_1.01,0.11594239473342896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,16,power_law_1.2,0.11491199731826782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,16,power_law_1.2,0.11811200380325318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,2,balanced,0.65775465965271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,2,balanced,0.6598933140436808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,2,power_law_1.01,0.5279744148254395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,2,power_law_1.01,0.5640639781951904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,2,power_law_1.2,0.5279551982879639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,2,power_law_1.2,0.5535168170928955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,32,balanced,0.10549867153167725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,32,balanced,0.10876267155011494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,32,power_law_1.01,0.0998848021030426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,32,power_law_1.01,0.10491520166397095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,32,power_law_1.2,0.10172799825668336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,32,power_law_1.2,0.10264320373535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,4,balanced,0.3534880081812541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,4,balanced,0.35672001043955487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,4,power_law_1.01,0.31806719303131104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,4,power_law_1.01,0.326528000831604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,4,power_law_1.2,0.30002560615539553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,4,power_law_1.2,0.31447041034698486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,8,balanced,0.2125813364982605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,8,balanced,0.21618133783340454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,8,power_law_1.01,0.20641920566558838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,8,power_law_1.01,0.20755200386047362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,8,power_law_1.2,0.20190720558166503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,1,8,power_law_1.2,0.20444159507751464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,2,1,balanced,0.6532320181528727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,2,1,balanced,0.6539146502812704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,2,1,power_law_1.01,0.5201216220855713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,2,1,power_law_1.01,0.5217152118682862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,2,1,power_law_1.2,0.5097792148590088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,2,1,power_law_1.2,0.5149248123168946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,4,1,balanced,0.3705493211746216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,4,1,balanced,0.3733439842859904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,4,1,power_law_1.01,0.302291202545166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,4,1,power_law_1.01,0.30550398826599123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,4,1,power_law_1.2,0.2929215908050537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,6144,2560,8,160,4,1,power_law_1.2,0.29806718826293943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,1,balanced,1.8190080324808757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,1,balanced,1.8292800585428874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,1,power_law_1.01,0.9512319564819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,1,power_law_1.01,0.9650367736816406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,1,power_law_1.2,0.8690879821777344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,1,power_law_1.2,0.9041215896606445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,128,balanced,0.08841066559155782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,128,balanced,0.09115200241406758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,128,power_law_1.01,0.08746240139007569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,128,power_law_1.01,0.09123839735984803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,128,power_law_1.2,0.08699520230293274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,128,power_law_1.2,0.0881663978099823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,16,balanced,0.16290666659673056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,16,balanced,0.16293332974116007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,16,power_law_1.01,0.13903360366821288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,16,power_law_1.01,0.14894720315933227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,16,power_law_1.2,0.13438719511032104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,16,power_law_1.2,0.14167040586471558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,2,balanced,0.9437867005666097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,2,balanced,0.9445226987202963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,2,power_law_1.01,0.570572805404663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,2,power_law_1.01,0.5827072143554688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,2,power_law_1.2,0.5062335968017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,2,power_law_1.2,0.5366655826568604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,256,balanced,0.07549333572387695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,256,balanced,0.07766399780909221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,256,power_law_1.01,0.07315199971199035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,256,power_law_1.01,0.07407360076904297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,256,power_law_1.2,0.07491199970245362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,256,power_law_1.2,0.07697920203208923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,32,balanced,0.12101333340009053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,32,balanced,0.1216373344262441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,32,power_law_1.01,0.10787839889526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,32,power_law_1.01,0.11050879955291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,32,power_law_1.2,0.10484479665756226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,32,power_law_1.2,0.10909440517425537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,4,balanced,0.508623997370402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,4,balanced,0.5105599959691366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,4,power_law_1.01,0.36373119354248046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,4,power_law_1.01,0.36631040573120116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,4,power_law_1.2,0.3573568105697632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,4,power_law_1.2,0.37857279777526853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,64,balanced,0.10132799545923869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,64,balanced,0.1018399993578593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,64,power_law_1.01,0.09752960205078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,64,power_law_1.01,0.09840000271797181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,64,power_law_1.2,0.096697598695755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,64,power_law_1.2,0.09998080134391785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,8,balanced,0.2791093389193217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,8,balanced,0.2813439965248108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,8,power_law_1.01,0.20206079483032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,8,power_law_1.01,0.25304958820343015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,8,power_law_1.2,0.22006399631500245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,1,8,power_law_1.2,0.23058559894561767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,16,1,balanced,0.20428800582885742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,16,1,balanced,0.20556267102559408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,16,1,power_law_1.01,0.13301759958267212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,16,1,power_law_1.01,0.13496320247650145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,16,1,power_law_1.2,0.12892160415649415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,16,1,power_law_1.2,0.1291327953338623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,2,1,balanced,0.947002649307251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,2,1,balanced,0.9478240013122559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,2,1,power_law_1.01,0.508076810836792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,2,1,power_law_1.01,0.5116479873657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,2,1,power_law_1.2,0.4629631996154785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,2,1,power_law_1.2,0.4917952060699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,4,1,balanced,0.5233920017878214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,4,1,balanced,0.5251146554946899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,4,1,power_law_1.01,0.2858304023742676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,4,1,power_law_1.01,0.28901760578155516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,4,1,power_law_1.2,0.2724800109863281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,4,1,power_law_1.2,0.2732736110687256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,8,1,balanced,0.3436746597290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,8,1,balanced,0.34402668476104736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,8,1,power_law_1.01,0.19114240407943725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,8,1,power_law_1.01,0.192467200756073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,8,1,power_law_1.2,0.16773120164871216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,256,8,1,power_law_1.2,0.1697216033935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,1,balanced,1.8235839207967122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,1,balanced,1.82477871576945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,1,power_law_1.01,1.187001609802246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,1,power_law_1.01,1.2311552047729493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,1,power_law_1.2,1.086079978942871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,1,power_law_1.2,1.1055232048034669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,128,balanced,0.08965333302815755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,128,balanced,0.09129066268603007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,128,power_law_1.01,0.09039999842643738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,128,power_law_1.01,0.09162240028381348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,128,power_law_1.2,0.09290879964828491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,128,power_law_1.2,0.09553279876708984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,16,balanced,0.16332800189654031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,16,balanced,0.16375466187795004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,16,power_law_1.01,0.2216639995574951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,16,power_law_1.01,0.23331201076507568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,16,power_law_1.2,0.22700159549713134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,16,power_law_1.2,0.24642560482025147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,2,balanced,0.9405439694722494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,2,balanced,0.94159468015035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,2,power_law_1.01,0.6844543933868408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,2,power_law_1.01,0.7294335842132569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,2,power_law_1.2,0.5679423809051514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,2,power_law_1.2,0.6544447898864746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,32,balanced,0.12125866611798604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,32,balanced,0.12164266904195149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,32,power_law_1.01,0.13634560108184815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,32,power_law_1.01,0.14161920547485352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,32,power_law_1.2,0.1282240033149719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,32,power_law_1.2,0.13633919954299928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,4,balanced,0.5099253257115682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,4,balanced,0.5117066701253256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,4,power_law_1.01,0.4860288143157959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,4,power_law_1.01,0.498579216003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,4,power_law_1.2,0.4600959777832031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,4,power_law_1.2,0.49157118797302246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,64,balanced,0.10240000486373901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,64,balanced,0.10242666800816853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,64,power_law_1.01,0.10264320373535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,64,power_law_1.01,0.10686719417572021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,64,power_law_1.2,0.10122879743576049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,64,power_law_1.2,0.10533759593963624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,8,balanced,0.2786986629168193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,8,balanced,0.27907200654347736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,8,power_law_1.01,0.3362943887710571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,8,power_law_1.01,0.3439039945602417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,8,power_law_1.2,0.34697599411010743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,1,8,power_law_1.2,0.3631808042526245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,16,1,balanced,0.20587732394536337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,16,1,balanced,0.2076373298962911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,16,1,power_law_1.01,0.1515328049659729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,16,1,power_law_1.01,0.1527999997138977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,16,1,power_law_1.2,0.14266239404678344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,16,1,power_law_1.2,0.14369280338287355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,2,1,balanced,0.9427839914957682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,2,1,balanced,0.9430239995320638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,2,1,power_law_1.01,0.6388671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,2,1,power_law_1.01,0.6455167770385742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,2,1,power_law_1.2,0.5606847763061523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,2,1,power_law_1.2,0.5742976188659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,4,1,balanced,0.5416373411814371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,4,1,balanced,0.5427253246307373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,4,1,power_law_1.01,0.36586239337921145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,4,1,power_law_1.01,0.3772991895675659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,4,1,power_law_1.2,0.3146239995956421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,4,1,power_law_1.2,0.3395136117935181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,8,1,balanced,0.3194506764411926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,8,1,balanced,0.32038400570551556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,8,1,power_law_1.01,0.2420736074447632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,8,1,power_law_1.01,0.24410240650177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,8,1,power_law_1.2,0.20535039901733398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,32,7168,2048,8,384,8,1,power_law_1.2,0.2120512008666992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,1,balanced,0.20595200856526694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,1,balanced,0.20608532428741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,1,power_law_1.01,0.19203200340270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,1,power_law_1.01,0.19486080408096312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,1,power_law_1.2,0.1956480026245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,1,power_law_1.2,0.1969472050666809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,128,balanced,0.06241600215435028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,128,balanced,0.06369066735108693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,128,power_law_1.01,0.06383360028266907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,128,power_law_1.01,0.06536960005760192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,128,power_law_1.2,0.0650816023349762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,128,power_law_1.2,0.06515840291976929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,16,balanced,0.07062399884064992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,16,balanced,0.0719413310289383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,16,power_law_1.01,0.07240319848060608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,16,power_law_1.01,0.0733568012714386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,16,power_law_1.2,0.0718720018863678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,16,power_law_1.2,0.07362560033798218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,2,balanced,0.15317866206169128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,2,balanced,0.15380799770355225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,2,power_law_1.01,0.15756160020828247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,2,power_law_1.01,0.15813119411468507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,2,power_law_1.2,0.16128640174865722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,2,power_law_1.2,0.16167039871215821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,32,balanced,0.06663466493288676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,32,balanced,0.06729599833488464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,32,power_law_1.01,0.0667519986629486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,32,power_law_1.01,0.06719359755516052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,32,power_law_1.2,0.06751999855041504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,32,power_law_1.2,0.0679040014743805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,4,balanced,0.11334932843844096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,4,balanced,0.11458133657773335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,4,power_law_1.01,0.11521919965744018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,4,power_law_1.01,0.11562240123748779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,4,power_law_1.2,0.11488640308380127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,4,power_law_1.2,0.11672320365905761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,64,balanced,0.06404800216356914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,64,balanced,0.06644799808661143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,64,power_law_1.01,0.06479359865188598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,64,power_law_1.01,0.06600319743156433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,64,power_law_1.2,0.06593919992446899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,64,power_law_1.2,0.06606720089912414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,8,balanced,0.07957866787910461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,8,balanced,0.08240533371766408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,8,power_law_1.01,0.08171520233154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,8,power_law_1.01,0.08220800161361694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,8,power_law_1.2,0.08179200291633607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,1,8,power_law_1.2,0.08357759714126586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,2,1,balanced,0.13485866785049438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,2,1,balanced,0.13557866215705872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,2,1,power_law_1.01,0.12573440074920655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,2,1,power_law_1.01,0.12606719732284546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,2,1,power_law_1.2,0.12723840475082399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,2048,768,8,128,2,1,power_law_1.2,0.12937599420547485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,1,balanced,1.0647253195444744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,1,balanced,1.065008004506429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,1,power_law_1.01,0.9534976005554199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,1,power_law_1.01,0.9555456161499023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,1,power_law_1.2,0.9536704063415528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,1,power_law_1.2,0.9903936386108398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,128,balanced,0.12411200006802876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,128,balanced,0.12583999832471213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,128,power_law_1.01,0.12184319496154786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,128,power_law_1.01,0.12260479927062988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,128,power_law_1.2,0.1251520037651062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,128,power_law_1.2,0.12595200538635254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,16,balanced,0.18098666270573935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,16,balanced,0.18173333009084067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,16,power_law_1.01,0.17701120376586915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,16,power_law_1.01,0.17783039808273315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,16,power_law_1.2,0.17745920419692993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,16,power_law_1.2,0.17893120050430297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,2,balanced,0.5989386638005575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,2,balanced,0.5991040070851644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,2,power_law_1.01,0.5319295883178711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,2,power_law_1.01,0.5375360012054443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,2,power_law_1.2,0.5602240085601806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,2,power_law_1.2,0.564902400970459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,256,balanced,0.11969600121180217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,256,balanced,0.12148267030715942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,256,power_law_1.01,0.11875200271606445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,256,power_law_1.01,0.11941759586334229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,256,power_law_1.2,0.12117760181427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,256,power_law_1.2,0.12183680534362792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,32,balanced,0.15005866686503092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,32,balanced,0.15030399958292642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,32,power_law_1.01,0.14479999542236327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,32,power_law_1.01,0.14621440172195435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,32,power_law_1.2,0.14791040420532225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,32,power_law_1.2,0.15340160131454467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,4,balanced,0.3654986619949341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,4,balanced,0.3663040002187093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,4,power_law_1.01,0.33264000415802003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,4,power_law_1.01,0.3400511980056763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,4,power_law_1.2,0.33857920169830324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,4,power_law_1.2,0.3493760108947754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,64,balanced,0.13177067041397095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,64,balanced,0.13192533453305563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,64,power_law_1.01,0.1298815965652466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,64,power_law_1.01,0.13096959590911866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,64,power_law_1.2,0.13308800458908082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,64,power_law_1.2,0.13336960077285767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,8,balanced,0.24487467606862387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,8,balanced,0.24497600396474203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,8,power_law_1.01,0.2256256103515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,8,power_law_1.01,0.2347520112991333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,8,power_law_1.2,0.2362816095352173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,1,8,power_law_1.2,0.2381824016571045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,2,1,balanced,0.5955679814020792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,2,1,balanced,0.5956053336461385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,2,1,power_law_1.01,0.541542387008667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,2,1,power_law_1.01,0.5446784019470214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,2,1,power_law_1.2,0.5481279850006103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,2,1,power_law_1.2,0.5498752117156982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,4,1,balanced,0.3613813320795695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,4,1,balanced,0.36246931552886963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,4,1,power_law_1.01,0.3213696002960205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,4,1,power_law_1.01,0.32188799381256106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,4,1,power_law_1.2,0.324947190284729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,3072,1536,8,256,4,1,power_law_1.2,0.32912640571594237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,1,balanced,0.8064906597137451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,1,balanced,0.8094507058461508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,1,power_law_1.01,0.7745024204254151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,1,power_law_1.01,0.7807360172271729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,1,power_law_1.2,0.7805952072143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,1,power_law_1.2,0.7809855937957764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,2,balanced,0.47592000166575116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,2,balanced,0.4772426684697469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,2,power_law_1.01,0.48076801300048827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,2,power_law_1.01,0.5287936210632325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,2,power_law_1.2,0.4830848217010498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,2,power_law_1.2,0.5947968006134033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,4,balanced,0.36211200555165607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,4,balanced,0.362773338953654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,4,power_law_1.01,0.4020671844482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,4,power_law_1.01,0.40256638526916505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,4,power_law_1.2,0.4147520065307617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,4,power_law_1.2,0.42536320686340334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,8,balanced,0.29763732353846234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,8,balanced,0.30135466655095416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,8,power_law_1.01,0.358732795715332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,8,power_law_1.01,0.3619391918182373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,8,power_law_1.2,0.3555392026901245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,1,8,power_law_1.2,0.36055679321289064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,16,1,balanced,0.09745066364606221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,16,1,balanced,0.10162132978439331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,16,1,power_law_1.01,0.09559040069580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,16,1,power_law_1.01,0.09667199850082397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,16,1,power_law_1.2,0.09733759760856628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,16,1,power_law_1.2,0.09784960150718688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,2,1,balanced,0.44117867946624756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,2,1,balanced,0.44308265050252277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,2,1,power_law_1.01,0.41050238609313966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,2,1,power_law_1.01,0.42505598068237305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,2,1,power_law_1.2,0.4031680107116699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,2,1,power_law_1.2,0.426361608505249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,4,1,balanced,0.25810666879018146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,4,1,balanced,0.25888532400131226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,4,1,power_law_1.01,0.22729599475860596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,4,1,power_law_1.01,0.24457600116729736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,4,1,power_law_1.2,0.23216640949249268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,4,1,power_law_1.2,0.2383039951324463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,8,1,balanced,0.15061333775520325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,8,1,balanced,0.15412267049153647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,8,1,power_law_1.01,0.15101439952850343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,8,1,power_law_1.01,0.15162880420684816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,8,1,power_law_1.2,0.1503167986869812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,14336,2,8,8,1,power_law_1.2,0.15176960229873657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,1,balanced,0.7360640366872152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,1,balanced,0.7387359937032064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,1,power_law_1.01,0.7689151763916016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,1,power_law_1.01,0.7760064125061035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,1,power_law_1.2,0.7871615886688232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,1,power_law_1.2,0.7908031940460205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,128,balanced,0.10959999759991963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,128,balanced,0.1122773289680481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,128,power_law_1.01,0.1139456033706665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,128,power_law_1.01,0.11631360054016113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,128,power_law_1.2,0.11660799980163575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,128,power_law_1.2,0.11807359457015991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,16,balanced,0.14073066910107931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,16,balanced,0.14110933740933737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,16,power_law_1.01,0.14877439737319947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,16,power_law_1.01,0.15022720098495485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,16,power_law_1.2,0.1526975989341736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,16,power_law_1.2,0.15356800556182862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,2,balanced,0.4373226563135783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,2,balanced,0.4382293224334717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,2,power_law_1.01,0.4423935890197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,2,power_law_1.01,0.44720001220703126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,2,power_law_1.2,0.44449281692504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,2,power_law_1.2,0.45111680030822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,32,balanced,0.12813333670298258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,32,balanced,0.13010133306185404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,32,power_law_1.01,0.12984319925308227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,32,power_law_1.01,0.13139840364456176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,32,power_law_1.2,0.13190399408340453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,32,power_law_1.2,0.13342080116271973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,4,balanced,0.2635040084520976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,4,balanced,0.2646720012029012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,4,power_law_1.01,0.2816512107849121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,4,power_law_1.01,0.28998401165008547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,4,power_law_1.2,0.2840192079544067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,4,power_law_1.2,0.30220799446105956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,64,balanced,0.12017066280047099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,64,balanced,0.12146133184432983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,64,power_law_1.01,0.12291200160980224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,64,power_law_1.01,0.12314239740371705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,64,power_law_1.2,0.12343679666519165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,64,power_law_1.2,0.12439680099487305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,8,balanced,0.19154133399327597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,8,balanced,0.19218132893244425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,8,power_law_1.01,0.19245439767837524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,8,power_law_1.01,0.19591039419174194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,8,power_law_1.2,0.1968127965927124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,1,8,power_law_1.2,0.1977280020713806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,2,1,balanced,0.35582931836446124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,2,1,balanced,0.3580160140991211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,2,1,power_law_1.01,0.33803520202636717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,2,1,power_law_1.01,0.3397056102752686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,2,1,power_law_1.2,0.3413183927536011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,2,1,power_law_1.2,0.34286720752716066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,4,1,balanced,0.22750933965047201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,4,1,balanced,0.22826667626698813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,4,1,power_law_1.01,0.21211519241333007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,4,1,power_law_1.01,0.21356799602508544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,4,1,power_law_1.2,0.21493120193481446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,1536,8,128,4,1,power_law_1.2,0.21575679779052734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,1,balanced,4.613946596781413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,1,balanced,4.614735921223958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,1,power_law_1.01,4.36682243347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,1,power_law_1.01,4.406272125244141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,1,power_law_1.2,4.562476730346679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,1,power_law_1.2,4.615660858154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,128,balanced,0.3930026690165202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,128,balanced,0.3940693140029907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,128,power_law_1.01,0.39791359901428225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,128,power_law_1.01,0.3988800048828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,128,power_law_1.2,0.4080383777618408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,128,power_law_1.2,0.4080639839172363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,16,balanced,0.6403306722640991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,16,balanced,0.6417920192082723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,16,power_law_1.01,0.6365824222564698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,16,power_law_1.01,0.6451263904571534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,16,power_law_1.2,0.6583551883697509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,16,power_law_1.2,0.6629951953887939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,2,balanced,2.5126612981160483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,2,balanced,2.5142666498819985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,2,power_law_1.01,2.397689628601074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,2,power_law_1.01,2.4006847381591796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,2,power_law_1.2,2.5047807693481445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,2,power_law_1.2,2.5256832122802733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,256,balanced,0.3744479815165202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,256,balanced,0.3766506512959798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,256,power_law_1.01,0.38265600204467776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,256,power_law_1.01,0.38304638862609863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,256,power_law_1.2,0.38754560947418215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,256,power_law_1.2,0.3879296064376831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,32,balanced,0.5018346707026163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,32,balanced,0.502128005027771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,32,power_law_1.01,0.5067391872406006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,32,power_law_1.01,0.5093376159667968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,32,power_law_1.2,0.522156810760498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,32,power_law_1.2,0.5233215808868408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,4,balanced,1.4472907384236653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,4,balanced,1.451573371887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,4,power_law_1.01,1.390617561340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,4,power_law_1.01,1.4030912399291993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,4,power_law_1.2,1.4778112411499023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,4,power_law_1.2,1.488704013824463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,64,balanced,0.4352586666742961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,64,balanced,0.43861865997314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,64,power_law_1.01,0.43930878639221194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,64,power_law_1.01,0.4448063850402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,64,power_law_1.2,0.445798397064209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,64,power_law_1.2,0.4463679790496826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,8,balanced,0.9141706625620524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,8,balanced,0.9182506402333578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,8,power_law_1.01,0.8978048324584961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,8,power_law_1.01,0.8996928215026856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,8,power_law_1.2,0.9170175552368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,4096,2688,22,512,1,8,power_law_1.2,0.9172863960266113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,1,balanced,1.280741294225057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,1,balanced,1.2809546788533528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,1,power_law_1.01,1.245958423614502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,1,power_law_1.01,1.247257614135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,1,power_law_1.2,1.2139904022216796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,1,power_law_1.2,1.220627212524414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,2,balanced,0.7795413335164388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,2,balanced,0.7807306448618571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,2,power_law_1.01,0.7977407932281494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,2,power_law_1.01,0.8114560127258301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,2,power_law_1.2,0.8199295997619629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,2,power_law_1.2,0.839846420288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,4,balanced,0.4727360010147095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,4,balanced,0.4761386712392171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,4,power_law_1.01,0.5896895885467529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,4,power_law_1.01,0.6304128170013428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,4,power_law_1.2,0.5556543827056885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,4,power_law_1.2,0.6348544120788574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,8,balanced,0.3747466802597046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,8,balanced,0.37548800309499103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,8,power_law_1.01,0.4811840057373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,8,power_law_1.01,0.4825535774230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,8,power_law_1.2,0.49013118743896483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,1,8,power_law_1.2,0.5003647804260254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,16,1,balanced,0.13662399848302206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,16,1,balanced,0.1379146675268809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,16,1,power_law_1.01,0.13388160467147828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,16,1,power_law_1.01,0.13496960401535035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,16,1,power_law_1.2,0.13373440504074097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,16,1,power_law_1.2,0.13388799428939818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,2,1,balanced,0.6662720044453939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,2,1,balanced,0.6675946712493896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,2,1,power_law_1.01,0.6581759929656983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,2,1,power_law_1.01,0.6605631828308105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,2,1,power_law_1.2,0.6556863784790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,2,1,power_law_1.2,0.6598656177520752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,32,1,balanced,0.11036800344785054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,32,1,balanced,0.11401599645614624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,32,1,power_law_1.01,0.10995839834213257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,32,1,power_law_1.01,0.11263359785079956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,32,1,power_law_1.2,0.11510399580001832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,32,1,power_law_1.2,0.11519999504089355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,4,1,balanced,0.3817066748936971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,4,1,balanced,0.3834826548894246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,4,1,power_law_1.01,0.37690880298614504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,4,1,power_law_1.01,0.3771712064743042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,4,1,power_law_1.2,0.36849920749664306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,4,1,power_law_1.2,0.37784318923950194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,8,1,balanced,0.21753599246342978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,8,1,balanced,0.21862934033075967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,8,1,power_law_1.01,0.21582720279693604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,8,1,power_law_1.01,0.21647360324859619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,8,1,power_law_1.2,0.21577599048614501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,16384,2,8,8,1,power_law_1.2,0.21639680862426758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,1,balanced,2.6084799766540527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,1,balanced,2.610682646433512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,1,power_law_1.01,2.2721536636352537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,1,power_law_1.01,2.315839958190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,1,power_law_1.2,2.3600448608398437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,1,power_law_1.2,2.399443244934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,128,balanced,0.20058133204778036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,128,balanced,0.2015413244565328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,128,power_law_1.01,0.19997440576553344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,128,power_law_1.01,0.20013439655303955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,128,power_law_1.2,0.20370559692382811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,128,power_law_1.2,0.20434560775756835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,16,balanced,0.33619733651479083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,16,balanced,0.33683733145395917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,16,power_law_1.01,0.32396159172058103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,16,power_law_1.01,0.3269504070281982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,16,power_law_1.2,0.3228800058364868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,16,power_law_1.2,0.3288896083831787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,2,balanced,1.400986671447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,2,balanced,1.4010826746622722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,2,power_law_1.01,1.2361472129821778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,2,power_law_1.01,1.2759360313415526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,2,power_law_1.2,1.2831808090209962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,2,power_law_1.2,1.2997247695922851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,256,balanced,0.196234663327535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,256,balanced,0.19781333208084106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,256,power_law_1.01,0.19406720399856567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,256,power_law_1.01,0.19500160217285156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,256,power_law_1.2,0.19645440578460693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,256,power_law_1.2,0.1975872039794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,32,balanced,0.2606933315594991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,32,balanced,0.2608960072199504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,32,power_law_1.01,0.25075840950012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,32,power_law_1.01,0.2550976037979126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,32,power_law_1.2,0.25550720691680906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,32,power_law_1.2,0.25851519107818605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,4,balanced,0.7999306519826254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,4,balanced,0.8005867004394531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,4,power_law_1.01,0.7382080078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,4,power_law_1.01,0.7404287815093994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,4,power_law_1.2,0.7472640037536621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,4,power_law_1.2,0.7522240161895752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,64,balanced,0.21749866008758545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,64,balanced,0.21787200371424356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,64,power_law_1.01,0.21418240070343017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,64,power_law_1.01,0.2141887903213501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,64,power_law_1.2,0.22076799869537353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,64,power_law_1.2,0.22473599910736083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,8,balanced,0.49235733350118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,8,balanced,0.4938826560974121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,8,power_law_1.01,0.44821758270263673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,8,power_law_1.01,0.4655360221862793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,8,power_law_1.2,0.47788801193237307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,1,8,power_law_1.2,0.4840832233428955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,16,1,balanced,0.3635840018590291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,16,1,balanced,0.3643519878387451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,16,1,power_law_1.01,0.343724799156189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,16,1,power_law_1.01,0.34427518844604493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,16,1,power_law_1.2,0.34561920166015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,16,1,power_law_1.2,0.348307204246521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,2,1,balanced,1.3926506042480469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,2,1,balanced,1.3934027353922527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,2,1,power_law_1.01,1.2520000457763671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,2,1,power_law_1.01,1.2528191566467286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,2,1,power_law_1.2,1.2782719612121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,2,1,power_law_1.2,1.2938240051269532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,4,1,balanced,0.4820106824239095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,4,1,balanced,0.4824213186899821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,4,1,power_law_1.01,0.48447360992431643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,4,1,power_law_1.01,0.4963007926940918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,4,1,power_law_1.2,0.49422078132629393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,4,1,power_law_1.2,0.5002816200256348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,8,1,balanced,0.30763200918833417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,8,1,balanced,0.31031467517217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,8,1,power_law_1.01,0.3285952091217041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,8,1,power_law_1.01,0.3305344104766846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,8,1,power_law_1.2,0.3323391914367676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2048,8,256,8,1,power_law_1.2,0.33379199504852297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,1,balanced,2.0788745880126953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,1,balanced,2.0794827143351235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,1,power_law_1.01,2.0303359985351563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,1,power_law_1.01,2.0771648406982424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,1,power_law_1.2,2.141804885864258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,1,power_law_1.2,2.158310317993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,16,balanced,0.285098671913147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,16,balanced,0.28547199567159015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,16,power_law_1.01,0.287609601020813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,16,power_law_1.01,0.2878079891204834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,16,power_law_1.2,0.29258880615234373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,16,power_law_1.2,0.2971519947052002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,2,balanced,1.120421330134074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,2,balanced,1.1219786802927654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,2,power_law_1.01,1.125171184539795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,2,power_law_1.01,1.1446144104003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,2,power_law_1.2,1.1303808212280273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,2,power_law_1.2,1.1734463691711425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,32,balanced,0.21792000532150269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,32,balanced,0.2182933290799459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,32,power_law_1.01,0.229369592666626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,32,power_law_1.01,0.23143041133880615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,32,power_law_1.2,0.24408960342407227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,32,power_law_1.2,0.2464063882827759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,4,balanced,0.6394453446070353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,4,balanced,0.641045331954956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,4,power_law_1.01,0.6465919971466064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,4,power_law_1.01,0.6539072036743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,4,power_law_1.2,0.6598400115966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,4,power_law_1.2,0.6863296031951904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,8,balanced,0.40303464730580646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,8,balanced,0.403711994489034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,8,power_law_1.01,0.40015997886657717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,8,power_law_1.01,0.41648001670837403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,8,power_law_1.2,0.4400576114654541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,1,8,power_law_1.2,0.44197759628295896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,2,1,balanced,1.1071253617604573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,2,1,balanced,1.10753599802653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,2,1,power_law_1.01,1.1060352325439453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,2,1,power_law_1.01,1.109721565246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,2,1,power_law_1.2,1.1533120155334473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,2,1,power_law_1.2,1.1603903770446777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,4,1,balanced,0.3834880193074544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,4,1,balanced,0.38442134857177734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,4,1,power_law_1.01,0.46233601570129396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,4,1,power_law_1.01,0.4653503894805908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,4,1,power_law_1.2,0.47354879379272463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,6144,2560,8,160,4,1,power_law_1.2,0.47420802116394045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,1,balanced,3.035344123840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,1,balanced,3.03657595316569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,1,power_law_1.01,2.667180824279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,1,power_law_1.01,2.6784896850585938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,1,power_law_1.2,2.753830337524414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,1,power_law_1.2,2.7927936553955077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,128,balanced,0.22487467527389526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,128,balanced,0.22679466009140015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,128,power_law_1.01,0.22568318843841553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,128,power_law_1.01,0.22602880001068115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,128,power_law_1.2,0.22653439044952392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,128,power_law_1.2,0.22965760231018068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,16,balanced,0.3782026767730713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,16,balanced,0.3796159823735555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,16,power_law_1.01,0.36769280433654783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,16,power_law_1.01,0.3719871997833252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,16,power_law_1.2,0.37370240688323975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,16,power_law_1.2,0.3810816049575806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,2,balanced,1.6237279574076335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,2,balanced,1.624714692433675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,2,power_law_1.01,1.444179153442383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,2,power_law_1.01,1.4468607902526855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,2,power_law_1.2,1.4591936111450194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,2,power_law_1.2,1.5229120254516602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,256,balanced,0.21896000703175864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,256,balanced,0.22006400426228842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,256,power_law_1.01,0.21863040924072266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,256,power_law_1.01,0.21967999935150145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,256,power_law_1.2,0.22137598991394042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,256,power_law_1.2,0.22145280838012696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,32,balanced,0.2876853346824646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,32,balanced,0.2883946696917216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,32,power_law_1.01,0.27730560302734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,32,power_law_1.01,0.28067200183868407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,32,power_law_1.2,0.2871936082839966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,32,power_law_1.2,0.29393279552459717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,4,balanced,0.9183786710103353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,4,balanced,0.9184746742248535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,4,power_law_1.01,0.824403190612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,4,power_law_1.01,0.8587967872619628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,4,power_law_1.2,0.8491519927978516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,4,power_law_1.2,0.885427188873291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,64,balanced,0.23879466454188028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,64,balanced,0.23959465821584067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,64,power_law_1.01,0.23675520420074464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,64,power_law_1.01,0.2377471923828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,64,power_law_1.2,0.24141440391540528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,64,power_law_1.2,0.250220799446106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,8,balanced,0.5687040090560913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,8,balanced,0.5687413215637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,8,power_law_1.01,0.502348804473877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,8,power_law_1.01,0.5339456081390381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,8,power_law_1.2,0.556550407409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,1,8,power_law_1.2,0.5587520122528076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,16,1,balanced,0.41890132427215576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,16,1,balanced,0.4191253185272217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,16,1,power_law_1.01,0.39324159622192384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,16,1,power_law_1.01,0.39562880992889404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,16,1,power_law_1.2,0.4011072158813477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,16,1,power_law_1.2,0.40203518867492677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,2,1,balanced,1.622869332631429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,2,1,balanced,1.6238346099853516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,2,1,power_law_1.01,1.408403205871582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,2,1,power_law_1.01,1.4876416206359864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,2,1,power_law_1.2,1.4743231773376464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,2,1,power_law_1.2,1.5186176300048828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,4,1,balanced,0.5599040190378824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,4,1,balanced,0.5608853499094645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,4,1,power_law_1.01,0.5663487911224365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,4,1,power_law_1.01,0.5695360183715821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,4,1,power_law_1.2,0.5779583930969239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,4,1,power_law_1.2,0.5793536186218262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,8,1,balanced,0.3582346836725871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,8,1,balanced,0.36106133460998535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,8,1,power_law_1.01,0.38127360343933103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,8,1,power_law_1.01,0.3828223943710327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,8,1,power_law_1.2,0.385369610786438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,256,8,1,power_law_1.2,0.38837759494781493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,1,balanced,4.472458521525065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,1,balanced,4.474800109863281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,1,power_law_1.01,3.638092803955078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,1,power_law_1.01,3.67154541015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,1,power_law_1.2,3.6497535705566406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,1,power_law_1.2,3.6619583129882813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,128,balanced,0.2820693254470825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,128,balanced,0.2832053303718567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,128,power_law_1.01,0.27692160606384275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,128,power_law_1.01,0.28101119995117185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,128,power_law_1.2,0.28044800758361815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,128,power_law_1.2,0.2812288045883179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,16,balanced,0.5223360061645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,16,balanced,0.5240213473637899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,16,power_law_1.01,0.48596482276916503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,16,power_law_1.01,0.49141759872436525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,16,power_law_1.2,0.48864002227783204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,16,power_law_1.2,0.49171199798583987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,2,balanced,2.3669439951578775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,2,balanced,2.367237408955892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,2,power_law_1.01,1.9870080947875977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,2,power_law_1.01,2.037388801574707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,2,power_law_1.2,1.9341888427734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,2,power_law_1.2,2.085772705078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,32,balanced,0.38950932025909424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,32,balanced,0.39262934525807697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,32,power_law_1.01,0.3736191987991333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,32,power_law_1.01,0.3806207895278931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,32,power_law_1.2,0.37185919284820557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,32,power_law_1.2,0.3829823970794678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,4,balanced,1.3165547053019206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,4,balanced,1.319648027420044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,4,power_law_1.01,1.1313152313232422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,4,power_law_1.01,1.1370304107666016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,4,power_law_1.2,1.1284543991088867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,4,power_law_1.2,1.1355392456054687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,64,balanced,0.3168213367462158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,64,balanced,0.3182613253593445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,64,power_law_1.01,0.3121920108795166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,64,power_law_1.01,0.31617920398712157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,64,power_law_1.2,0.3072704076766968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,64,power_law_1.2,0.30933120250701907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,8,balanced,0.7912480036417643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,8,balanced,0.7923093636830648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,8,power_law_1.01,0.6703040122985839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,8,power_law_1.01,0.7290688037872315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,8,power_law_1.2,0.6586431980133056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,1,8,power_law_1.2,0.7029823780059814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,16,1,balanced,0.3401973247528076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,16,1,balanced,0.3407786687215169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,16,1,power_law_1.01,0.3145663976669312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,16,1,power_law_1.01,0.31741440296173096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,16,1,power_law_1.2,0.3156928062438965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,16,1,power_law_1.2,0.3209791898727417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,2,1,balanced,2.3774612744649253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,2,1,balanced,2.3776532808939614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,2,1,power_law_1.01,1.9507007598876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,2,1,power_law_1.01,1.9584192276000976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,2,1,power_law_1.2,1.9355648040771485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,2,1,power_law_1.2,1.9737024307250977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,4,1,balanced,1.3537012736002605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,4,1,balanced,1.356778621673584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,4,1,power_law_1.01,1.135308837890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,4,1,power_law_1.01,1.1468480110168457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,4,1,power_law_1.2,1.119206428527832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,4,1,power_law_1.2,1.1359616279602052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,8,1,balanced,0.4792533318201701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,8,1,balanced,0.4813599983851115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,8,1,power_law_1.01,0.43948798179626464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,8,1,power_law_1.01,0.4417088031768799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,8,1,power_law_1.2,0.4454847812652588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,320,7168,2048,8,384,8,1,power_law_1.2,0.44754562377929685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,1,balanced,0.20945066213607788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,1,balanced,0.21006399393081665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,1,power_law_1.01,0.21461760997772217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,1,power_law_1.01,0.21527678966522218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,1,power_law_1.2,0.21787519454956056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,1,power_law_1.2,0.21829121112823485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,128,balanced,0.06746133168538411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,128,balanced,0.06914133330186208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,128,power_law_1.01,0.06846079826354981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,128,power_law_1.01,0.06928640007972717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,128,power_law_1.2,0.07088000178337098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,128,power_law_1.2,0.07277439832687378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,16,balanced,0.07838933169841766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,16,balanced,0.07866666714350383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,16,power_law_1.01,0.0803391993045807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,16,power_law_1.01,0.08203520178794861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,16,power_law_1.2,0.07868800163269044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,16,power_law_1.2,0.08140159845352173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,2,balanced,0.1597813367843628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,2,balanced,0.1602666676044464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,2,power_law_1.01,0.16885119676589966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,2,power_law_1.01,0.17288960218429567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,2,power_law_1.2,0.17704319953918457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,2,power_law_1.2,0.17861119508743287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,32,balanced,0.07208000123500824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,32,balanced,0.07307733098665874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,32,power_law_1.01,0.07266560196876526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,32,power_law_1.01,0.07276800274848938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,32,power_law_1.2,0.07269759774208069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,32,power_law_1.2,0.07361279726028443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,4,balanced,0.11931199828783672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,4,balanced,0.11993066469828288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,4,power_law_1.01,0.1221119999885559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,4,power_law_1.01,0.12231680154800414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,4,power_law_1.2,0.12349439859390259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,4,power_law_1.2,0.12416640520095826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,64,balanced,0.06811733543872833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,64,balanced,0.07027199864387512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,64,power_law_1.01,0.0705407977104187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,64,power_law_1.01,0.07056000232696533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,64,power_law_1.2,0.07160959839820862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,64,power_law_1.2,0.07167360186576843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,8,balanced,0.08894933263460796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,8,balanced,0.08898133039474487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,8,power_law_1.01,0.09126399755477906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,8,power_law_1.01,0.09283840060234069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,8,power_law_1.2,0.09245439767837524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,1,8,power_law_1.2,0.09337599873542786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,2,1,balanced,0.13675199945767721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,2,1,balanced,0.13793067137400308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,2,1,power_law_1.01,0.13687039613723756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,2,1,power_law_1.01,0.13956480026245116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,2,1,power_law_1.2,0.1416640043258667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,2048,768,8,128,2,1,power_law_1.2,0.14254720211029054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,1,balanced,1.0741759936014812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,1,balanced,1.0742080211639404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,1,power_law_1.01,0.9660160064697265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,1,power_law_1.01,0.9870911598205566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,1,power_law_1.2,1.0196800231933594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,1,power_law_1.2,1.028332805633545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,128,balanced,0.130021333694458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,128,balanced,0.13181333740552267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,128,power_law_1.01,0.13018879890441895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,128,power_law_1.01,0.1306496024131775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,128,power_law_1.2,0.13269120454788208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,128,power_law_1.2,0.13276159763336182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,16,balanced,0.1891253391901652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,16,balanced,0.19013333320617676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,16,power_law_1.01,0.18407039642333983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,16,power_law_1.01,0.18607360124588013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,16,power_law_1.2,0.187827205657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,16,power_law_1.2,0.1928704023361206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,2,balanced,0.6074133316675822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,2,balanced,0.6080053249994913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,2,power_law_1.01,0.5560639858245849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,2,power_law_1.01,0.5626495838165283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,2,power_law_1.2,0.5650496006011962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,2,power_law_1.2,0.580838394165039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,256,balanced,0.12591999769210815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,256,balanced,0.12595199545224509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,256,power_law_1.01,0.12782080173492433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,256,power_law_1.01,0.12839679718017577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,256,power_law_1.2,0.12738560438156127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,256,power_law_1.2,0.1299456000328064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,32,balanced,0.1572373310724894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,32,balanced,0.1583093305428823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,32,power_law_1.01,0.15322240591049194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,32,power_law_1.01,0.15356800556182862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,32,power_law_1.2,0.1578752040863037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,32,power_law_1.2,0.16009600162506105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,4,balanced,0.3738400141398112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,4,balanced,0.37417598565419513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,4,power_law_1.01,0.33851521015167235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,4,power_law_1.01,0.349452805519104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,4,power_law_1.2,0.3598272085189819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,4,power_law_1.2,0.3682240009307861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,64,balanced,0.14009066422780356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,64,balanced,0.14043733477592468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,64,power_law_1.01,0.1409216046333313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,64,power_law_1.01,0.14142080545425414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,64,power_law_1.2,0.14132479429244996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,64,power_law_1.2,0.1415552020072937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,8,balanced,0.25062400102615356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,8,balanced,0.2526666720708211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,8,power_law_1.01,0.24046080112457274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,8,power_law_1.01,0.2424704074859619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,8,power_law_1.2,0.2506943941116333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,1,8,power_law_1.2,0.2508608102798462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,2,1,balanced,0.6018773317337036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,2,1,balanced,0.6028693517049154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,2,1,power_law_1.01,0.5516223907470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,2,1,power_law_1.01,0.5557504177093506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,2,1,power_law_1.2,0.5724736213684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,2,1,power_law_1.2,0.5787263870239258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,4,1,balanced,0.36665598551432294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,4,1,balanced,0.36719465255737305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,4,1,power_law_1.01,0.32284159660339357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,4,1,power_law_1.01,0.32743039131164553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,4,1,power_law_1.2,0.3306623935699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,3072,1536,8,256,4,1,power_law_1.2,0.3364736080169678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,1,balanced,0.824677308400472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,1,balanced,0.8268160025278727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,1,power_law_1.01,0.8346240043640136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,1,power_law_1.01,0.8346688270568847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,1,power_law_1.2,0.8335871696472168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,1,power_law_1.2,0.8472319602966308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,2,balanced,0.49193068345387775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,2,balanced,0.493343989054362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,2,power_law_1.01,0.6018623828887939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,2,power_law_1.01,0.6071680068969727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,2,power_law_1.2,0.5351808071136475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,2,power_law_1.2,0.6577023983001709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,4,balanced,0.37597866853078205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,4,balanced,0.37616535027821857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,4,power_law_1.01,0.4609792232513428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,4,power_law_1.01,0.4958975791931152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,4,power_law_1.2,0.4580992221832275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,4,power_law_1.2,0.4872576236724854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,8,balanced,0.31435734033584595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,8,balanced,0.31681599219640094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,8,power_law_1.01,0.40254721641540525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,8,power_law_1.01,0.40641279220581056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,8,power_law_1.2,0.404691219329834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,1,8,power_law_1.2,0.40657920837402345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,16,1,balanced,0.10276800394058228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,16,1,balanced,0.10355200370152791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,16,1,power_law_1.01,0.1012992024421692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,16,1,power_law_1.01,0.10209920406341552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,16,1,power_law_1.2,0.10190080404281616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,16,1,power_law_1.2,0.10199040174484253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,2,1,balanced,0.4503146807352702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,2,1,balanced,0.450602650642395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,2,1,power_law_1.01,0.4413951873779297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,2,1,power_law_1.01,0.44780797958374025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,2,1,power_law_1.2,0.44425601959228517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,2,1,power_law_1.2,0.45172481536865233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,4,1,balanced,0.2612266739209493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,4,1,balanced,0.2654613256454468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,4,1,power_law_1.01,0.2626368045806885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,4,1,power_law_1.01,0.2636672019958496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,4,1,power_law_1.2,0.25736958980560304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,4,1,power_law_1.2,0.26204800605773926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,8,1,balanced,0.1553866664568583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,8,1,balanced,0.15938666462898254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,8,1,power_law_1.01,0.1561535954475403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,8,1,power_law_1.01,0.1562880039215088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,8,1,power_law_1.2,0.15607680082321168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,14336,2,8,8,1,power_law_1.2,0.1561535954475403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,1,balanced,0.747770627339681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,1,balanced,0.7482346693674723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,1,power_law_1.01,0.7919936180114746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,1,power_law_1.01,0.8053695678710937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,1,power_law_1.2,0.8203392028808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,1,power_law_1.2,0.8287103652954102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,128,balanced,0.12190933028856914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,128,balanced,0.12583999832471213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,128,power_law_1.01,0.12704000473022461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,128,power_law_1.01,0.12839679718017577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,128,power_law_1.2,0.12865279912948607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,128,power_law_1.2,0.12926080226898193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,16,balanced,0.1479200025399526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,16,balanced,0.14893333117167154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,16,power_law_1.01,0.16506880521774292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,16,power_law_1.01,0.16536959409713745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,16,power_law_1.2,0.1677248001098633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,16,power_law_1.2,0.16858880519866942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,2,balanced,0.4465493361155192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,2,balanced,0.44814932346343994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,2,power_law_1.01,0.4652224063873291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,2,power_law_1.01,0.4738175868988037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,2,power_law_1.2,0.4883456230163574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,2,power_law_1.2,0.4949952125549316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,32,balanced,0.13666133085886636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,32,balanced,0.1376533309618632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,32,power_law_1.01,0.1388479948043823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,32,power_law_1.01,0.14013439416885376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,32,power_law_1.2,0.13983999490737914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,32,power_law_1.2,0.14198399782180787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,4,balanced,0.27261332670847577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,4,balanced,0.2746613423029582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,4,power_law_1.01,0.3002559900283813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,4,power_law_1.01,0.30753920078277586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,4,power_law_1.2,0.31254398822784424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,4,power_law_1.2,0.3158720016479492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,64,balanced,0.12983999649683634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,64,balanced,0.13004799683888754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,64,power_law_1.01,0.130457603931427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,64,power_law_1.01,0.13258880376815796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,64,power_law_1.2,0.1335360050201416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,64,power_law_1.2,0.13392640352249147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,8,balanced,0.1997599999109904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,8,balanced,0.20001065731048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,8,power_law_1.01,0.20373120307922363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,8,power_law_1.01,0.20829439163208008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,8,power_law_1.2,0.2123136043548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,1,8,power_law_1.2,0.21466240882873536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,2,1,balanced,0.36400532722473145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,2,1,balanced,0.36483200391133624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,2,1,power_law_1.01,0.37329280376434326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,2,1,power_law_1.01,0.3767551898956299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,2,1,power_law_1.2,0.37969279289245605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,2,1,power_law_1.2,0.38519039154052737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,4,1,balanced,0.2310133377710978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,4,1,balanced,0.23122133811314902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,4,1,power_law_1.01,0.2371903896331787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,4,1,power_law_1.01,0.23955199718475342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,4,1,power_law_1.2,0.23959040641784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,1536,8,128,4,1,power_law_1.2,0.24061439037322999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,1,balanced,4.666666666666667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,1,balanced,4.66922664642334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,1,power_law_1.01,4.5617023468017575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,1,power_law_1.01,4.628947067260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,1,power_law_1.2,4.779584121704102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,1,power_law_1.2,4.8008575439453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,128,balanced,0.4286773204803467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,128,balanced,0.4293653170267741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,128,power_law_1.01,0.4400383949279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,128,power_law_1.01,0.443174409866333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,128,power_law_1.2,0.44591360092163085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,128,power_law_1.2,0.44997119903564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,16,balanced,0.6758826573689779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,16,balanced,0.6772747039794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,16,power_law_1.01,0.6868351936340332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,16,power_law_1.01,0.6886720180511474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,16,power_law_1.2,0.7056128025054932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,16,power_law_1.2,0.7087168216705322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,2,balanced,2.5576799710591636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,2,balanced,2.5592586199442544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,2,power_law_1.01,2.509350395202637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,2,power_law_1.01,2.5281280517578124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,2,power_law_1.2,2.620505523681641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,2,power_law_1.2,2.6236799240112303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,256,balanced,0.4082719882329305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,256,balanced,0.41074132919311523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,256,power_law_1.01,0.41880321502685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,256,power_law_1.01,0.42028160095214845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,256,power_law_1.2,0.4274752140045166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,256,power_law_1.2,0.4284992218017578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,32,balanced,0.53657599290212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,32,balanced,0.5375786622365316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,32,power_law_1.01,0.5493184089660644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,32,power_law_1.01,0.5568831920623779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,32,power_law_1.2,0.5560959815979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,32,power_law_1.2,0.5594944000244141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,4,balanced,1.4861173629760742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,4,balanced,1.488906701405843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,4,power_law_1.01,1.4805439949035644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,4,power_law_1.01,1.4919168472290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,4,power_law_1.2,1.5298815727233888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,4,power_law_1.2,1.5527551651000977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,64,balanced,0.46929065386454266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,64,balanced,0.4701226552327474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,64,power_law_1.01,0.48052477836608887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,64,power_law_1.01,0.4826240062713623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,64,power_law_1.2,0.4854144096374512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,64,power_law_1.2,0.48650240898132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,8,balanced,0.9515519936879476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,8,balanced,0.9528693358103434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,8,power_law_1.01,0.9440640449523926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,8,power_law_1.01,0.9913344383239746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,8,power_law_1.2,0.9735808372497559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,4096,2688,22,512,1,8,power_law_1.2,0.9970623970031738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,1,balanced,1.2998507022857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,1,balanced,1.301151990890503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,1,power_law_1.01,1.3124608039855956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,1,power_law_1.01,1.3213888168334962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,1,power_law_1.2,1.340556812286377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,1,power_law_1.2,1.3627840042114259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,2,balanced,0.8000586827596029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,2,balanced,0.8000853061676025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,2,power_law_1.01,0.9562560081481933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,2,power_law_1.01,0.9784768104553223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,2,power_law_1.2,0.9469759941101075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,2,power_law_1.2,0.965670394897461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,4,balanced,0.4903999964396159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,4,balanced,0.4943093458811442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,4,power_law_1.01,0.6776832103729248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,4,power_law_1.01,0.7693439960479737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,4,power_law_1.2,0.7198847770690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,4,power_law_1.2,0.7622655868530274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,8,balanced,0.38972798983256024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,8,balanced,0.39016000429789227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,8,power_law_1.01,0.4989759922027588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,8,power_law_1.01,0.5349055767059326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,8,power_law_1.2,0.5525951862335206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,1,8,power_law_1.2,0.56430082321167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,16,1,balanced,0.13904533783594766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,16,1,balanced,0.14203733205795288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,16,1,power_law_1.01,0.1381183981895447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,16,1,power_law_1.01,0.13953919410705568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,16,1,power_law_1.2,0.1391487956047058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,16,1,power_law_1.2,0.13998080492019654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,2,1,balanced,0.6744693120320638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,2,1,balanced,0.6748853524525961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,2,1,power_law_1.01,0.7011136054992676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,2,1,power_law_1.01,0.7120768070220947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,2,1,power_law_1.2,0.6923136234283447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,2,1,power_law_1.2,0.7102015972137451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,32,1,balanced,0.11896000305811565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,32,1,balanced,0.12129066387812297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,32,1,power_law_1.01,0.11886719465255738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,32,1,power_law_1.01,0.11960320472717285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,32,1,power_law_1.2,0.11912959814071655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,32,1,power_law_1.2,0.12094080448150635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,4,1,balanced,0.38604267438252765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,4,1,balanced,0.3891679843266805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,4,1,power_law_1.01,0.3886080026626587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,4,1,power_law_1.01,0.38946559429168703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,4,1,power_law_1.2,0.38656001091003417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,4,1,power_law_1.2,0.38762879371643066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,8,1,balanced,0.22489066918691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,8,1,balanced,0.2267520030339559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,8,1,power_law_1.01,0.22274560928344728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,8,1,power_law_1.01,0.22485120296478273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,8,1,power_law_1.2,0.2234112024307251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,16384,2,8,8,1,power_law_1.2,0.2358783960342407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,1,balanced,2.628448009490967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,1,balanced,2.6288320223490396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,1,power_law_1.01,2.338553619384766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,1,power_law_1.01,2.3587263107299803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,1,power_law_1.2,2.4364160537719726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,1,power_law_1.2,2.453023910522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,128,balanced,0.21196266015370688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,128,balanced,0.21208532651265463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,128,power_law_1.01,0.21150720119476318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,128,power_law_1.01,0.21247999668121337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,128,power_law_1.2,0.2159872055053711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,128,power_law_1.2,0.21675519943237304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,16,balanced,0.3505493402481079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,16,balanced,0.35075732072194415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,16,power_law_1.01,0.34007039070129397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,16,power_law_1.01,0.3461375951766968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,16,power_law_1.2,0.34812800884246825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,16,power_law_1.2,0.3502271890640259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,2,balanced,1.4178560574849446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,2,balanced,1.4188480377197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,2,power_law_1.01,1.2870847702026367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,2,power_law_1.01,1.295468807220459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,2,power_law_1.2,1.3420672416687012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,2,power_law_1.2,1.3637248039245606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,256,balanced,0.20562134186426798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,256,balanced,0.2064639925956726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,256,power_law_1.01,0.20643200874328613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,256,power_law_1.01,0.20689280033111573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,256,power_law_1.2,0.20746240615844727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,256,power_law_1.2,0.20799360275268555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,32,balanced,0.27436800797780353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,32,balanced,0.27509333690007526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,32,power_law_1.01,0.26725120544433595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,32,power_law_1.01,0.27355520725250243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,32,power_law_1.2,0.2786240100860596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,32,power_law_1.2,0.28922879695892334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,4,balanced,0.8170186678568522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,4,balanced,0.8175199826558431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,4,power_law_1.01,0.7685311794281006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,4,power_law_1.01,0.7694719791412353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,4,power_law_1.2,0.789958381652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,4,power_law_1.2,0.7916287899017334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,64,balanced,0.2290346622467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,64,balanced,0.23058666785558066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,64,power_law_1.01,0.22746241092681885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,64,power_law_1.01,0.2278143882751465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,64,power_law_1.2,0.23239679336547853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,64,power_law_1.2,0.23997440338134765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,8,balanced,0.5054346720377604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,8,balanced,0.5060319900512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,8,power_law_1.01,0.48336639404296877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,8,power_law_1.01,0.4974720001220703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,8,power_law_1.2,0.487775993347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,1,8,power_law_1.2,0.49855999946594237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,16,1,balanced,0.3697226842244466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,16,1,balanced,0.3708639939626058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,16,1,power_law_1.01,0.3512831926345825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,16,1,power_law_1.01,0.3534912109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,16,1,power_law_1.2,0.35797119140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,16,1,power_law_1.2,0.35934081077575686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,2,1,balanced,1.4047999382019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,2,1,balanced,1.405626614888509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,2,1,power_law_1.01,1.2653311729431151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,2,1,power_law_1.01,1.2890687942504884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,2,1,power_law_1.2,1.346835231781006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,2,1,power_law_1.2,1.3501055717468262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,4,1,balanced,0.49167998631795246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,4,1,balanced,0.4940640131632487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,4,1,power_law_1.01,0.5112895965576172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,4,1,power_law_1.01,0.5167232036590577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,4,1,power_law_1.2,0.521721601486206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,4,1,power_law_1.2,0.5322559833526611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,8,1,balanced,0.31860800584157306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,8,1,balanced,0.3195573290189107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,8,1,power_law_1.01,0.35146241188049315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,8,1,power_law_1.01,0.3517823934555054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,8,1,power_law_1.2,0.3577215909957886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2048,8,256,8,1,power_law_1.2,0.3580607891082764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,1,balanced,2.096245288848877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,1,balanced,2.098149299621582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,1,power_law_1.01,2.130784034729004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,1,power_law_1.01,2.1416831970214845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,1,power_law_1.2,2.1607295989990236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,1,power_law_1.2,2.2313535690307615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,16,balanced,0.29654399553934735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,16,balanced,0.29808000723520917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,16,power_law_1.01,0.3172287940979004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,16,power_law_1.01,0.3267008066177368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,16,power_law_1.2,0.31911680698394773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,16,power_law_1.2,0.34175360202789307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,2,balanced,1.1389973163604736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,2,balanced,1.1404159863789876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,2,power_law_1.01,1.1683712005615234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,2,power_law_1.01,1.1883456230163574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,2,power_law_1.2,1.196025562286377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,2,power_law_1.2,1.2161855697631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,32,balanced,0.23061333100001016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,32,balanced,0.23176000515619913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,32,power_law_1.01,0.24641919136047363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,32,power_law_1.01,0.2525887966156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,32,power_law_1.2,0.26257920265197754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,32,power_law_1.2,0.266048002243042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,4,balanced,0.6546453237533569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,4,balanced,0.655349334081014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,4,power_law_1.01,0.683839988708496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,4,power_law_1.01,0.6918015956878663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,4,power_law_1.2,0.6777599811553955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,4,power_law_1.2,0.7180031776428223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,8,balanced,0.41818666458129883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,8,balanced,0.4195626576741536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,8,power_law_1.01,0.4440192222595215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,8,power_law_1.01,0.4571712017059326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,8,power_law_1.2,0.45112318992614747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,1,8,power_law_1.2,0.4544896125793457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,2,1,balanced,1.1184319655100505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,2,1,balanced,1.120149294535319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,2,1,power_law_1.01,1.1681920051574708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,2,1,power_law_1.01,1.174790382385254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,2,1,power_law_1.2,1.1885631561279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,2,1,power_law_1.2,1.193830394744873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,4,1,balanced,0.5454506476720175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,4,1,balanced,0.5461973349253336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,4,1,power_law_1.01,0.5032192230224609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,4,1,power_law_1.01,0.5049088001251221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,4,1,power_law_1.2,0.517139196395874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,6144,2560,8,160,4,1,power_law_1.2,0.5196671962738038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,1,balanced,3.054101308186849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,1,balanced,3.0543254216512046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,1,power_law_1.01,2.778816032409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,1,power_law_1.01,2.785772705078125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,1,power_law_1.2,2.840780830383301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,1,power_law_1.2,2.9131776809692385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,128,balanced,0.23630932966868082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,128,balanced,0.23826666673024496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,128,power_law_1.01,0.2367232084274292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,128,power_law_1.01,0.23776640892028808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,128,power_law_1.2,0.23995521068572997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,128,power_law_1.2,0.2434175968170166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,16,balanced,0.3935146729151408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,16,balanced,0.39370131492614746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,16,power_law_1.01,0.3672895908355713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,16,power_law_1.01,0.38489599227905275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,16,power_law_1.2,0.38895359039306643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,16,power_law_1.2,0.4176511764526367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,2,balanced,1.6411199569702148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,2,balanced,1.642229398091634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,2,power_law_1.01,1.5072128295898437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,2,power_law_1.01,1.5201663970947266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,2,power_law_1.2,1.5598336219787599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,2,power_law_1.2,1.5657664299011231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,256,balanced,0.23036799828211466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,256,balanced,0.23119999965031943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,256,power_law_1.01,0.23219199180603028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,256,power_law_1.01,0.23235199451446534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,256,power_law_1.2,0.23175039291381835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,256,power_law_1.2,0.2320703983306885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,32,balanced,0.30268265803654987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,32,balanced,0.3029279907544454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,32,power_law_1.01,0.29957759380340576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,32,power_law_1.01,0.30100479125976565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,32,power_law_1.2,0.30855679512023926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,32,power_law_1.2,0.32283520698547363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,4,balanced,0.934058666229248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,4,balanced,0.9347573121388754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,4,power_law_1.01,0.8614656448364257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,4,power_law_1.01,0.8780608177185059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,4,power_law_1.2,0.8967167854309082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,4,power_law_1.2,0.9018176078796387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,64,balanced,0.2509866754213969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,64,balanced,0.2518720030784607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,64,power_law_1.01,0.25153279304504395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,64,power_law_1.01,0.2535680055618286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,64,power_law_1.2,0.26010239124298096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,64,power_law_1.2,0.2621119976043701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,8,balanced,0.5803146759668986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,8,balanced,0.5810720125834147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,8,power_law_1.01,0.566534423828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,8,power_law_1.01,0.5724287986755371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,8,power_law_1.2,0.5782464027404786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,1,8,power_law_1.2,0.5865600109100342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,16,1,balanced,0.4243146578470866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,16,1,balanced,0.42667198181152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,16,1,power_law_1.01,0.40597119331359866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,16,1,power_law_1.01,0.4064767837524414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,16,1,power_law_1.2,0.4104320049285889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,16,1,power_law_1.2,0.41152639389038087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,2,1,balanced,1.635002613067627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,2,1,balanced,1.6366453170776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,2,1,power_law_1.01,1.4776896476745605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,2,1,power_law_1.01,1.5077631950378418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,2,1,power_law_1.2,1.5491904258728026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,2,1,power_law_1.2,1.5560768127441407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,4,1,balanced,0.5677546660105387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,4,1,balanced,0.5686453183492025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,4,1,power_law_1.01,0.5899903774261475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,4,1,power_law_1.01,0.5958208084106446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,4,1,power_law_1.2,0.6061503887176514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,4,1,power_law_1.2,0.6120255947113037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,8,1,balanced,0.3670613368352254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,8,1,balanced,0.36872533957163495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,8,1,power_law_1.01,0.4025087833404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,8,1,power_law_1.01,0.40723838806152346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,8,1,power_law_1.2,0.4083263874053955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,256,8,1,power_law_1.2,0.4102911949157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,1,balanced,4.497088114420573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,1,balanced,4.499402681986491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,1,power_law_1.01,3.7332225799560548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,1,power_law_1.01,3.734956741333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,1,power_law_1.2,3.789535903930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,1,power_law_1.2,3.861164855957031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,128,balanced,0.29452266295750934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,128,balanced,0.29500800371170044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,128,power_law_1.01,0.2925055980682373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,128,power_law_1.01,0.29322240352630613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,128,power_law_1.2,0.29482879638671877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,128,power_law_1.2,0.29500160217285154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,16,balanced,0.535151998202006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,16,balanced,0.5363146861394247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,16,power_law_1.01,0.4946752071380615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,16,power_law_1.01,0.5152512073516846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,16,power_law_1.2,0.5036928176879882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,16,power_law_1.2,0.5181951999664307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,2,balanced,2.3875999450683594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,2,balanced,2.3890719413757324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,2,power_law_1.01,2.0023679733276367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,2,power_law_1.01,2.0107967376708986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,2,power_law_1.2,1.969887924194336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,2,power_law_1.2,2.122336006164551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,32,balanced,0.40347198645273846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,32,balanced,0.4038933515548706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,32,power_law_1.01,0.37921919822692873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,32,power_law_1.01,0.3883455991744995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,32,power_law_1.2,0.3867072105407715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,32,power_law_1.2,0.38711678981781006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,4,balanced,1.3347573280334473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,4,balanced,1.337125301361084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,4,power_law_1.01,1.1362751960754394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,4,power_law_1.01,1.1528703689575195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,4,power_law_1.2,1.1587840080261231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,4,power_law_1.2,1.1748224258422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,64,balanced,0.3304266730944316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,64,balanced,0.3308746616045634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,64,power_law_1.01,0.3195904016494751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,64,power_law_1.01,0.32712318897247317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,64,power_law_1.2,0.324019193649292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,64,power_law_1.2,0.3384063959121704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,8,balanced,0.8083413441975912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,8,balanced,0.8085119724273682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,8,power_law_1.01,0.6843904018402099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,8,power_law_1.01,0.7506303787231445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,8,power_law_1.2,0.7085375785827637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,1,8,power_law_1.2,0.7112576007843018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,16,1,balanced,0.34570666154225665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,16,1,balanced,0.3495146830876668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,16,1,power_law_1.01,0.3312000036239624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,16,1,power_law_1.01,0.3327615976333618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,16,1,power_law_1.2,0.332473611831665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,16,1,power_law_1.2,0.3339967966079712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,2,1,balanced,2.3916640281677246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,2,1,balanced,2.3920960426330566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,2,1,power_law_1.01,1.9899328231811524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,2,1,power_law_1.01,2.0391359329223633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,2,1,power_law_1.2,1.9791423797607421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,2,1,power_law_1.2,2.032153511047363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,4,1,balanced,1.365381399790446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,4,1,balanced,1.368303934733073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,4,1,power_law_1.01,1.1453503608703612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,4,1,power_law_1.01,1.167852783203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,4,1,power_law_1.2,1.1443327903747558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,4,1,power_law_1.2,1.154252815246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,8,1,balanced,0.484442671140035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,8,1,balanced,0.48717331886291504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,8,1,power_law_1.01,0.45620479583740237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,8,1,power_law_1.01,0.45688319206237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,8,1,power_law_1.2,0.4564352035522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,384,7168,2048,8,384,8,1,power_law_1.2,0.4591231822967529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,1,balanced,0.05403199791908264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,1,balanced,0.05454933146635691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,1,power_law_1.01,0.0523904025554657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,1,power_law_1.01,0.053376001119613645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,1,power_law_1.2,0.0514240026473999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,1,power_law_1.2,0.05198079943656921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,128,balanced,0.0356480007370313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,128,balanced,0.03774400055408478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,128,power_law_1.01,0.0344895988702774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,128,power_law_1.01,0.03596160113811493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,128,power_law_1.2,0.03527039885520935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,128,power_law_1.2,0.03534719944000244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,16,balanced,0.035690667728583016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,16,balanced,0.037461332976818085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,16,power_law_1.01,0.03622399866580963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,16,power_law_1.01,0.037222400307655334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,16,power_law_1.2,0.03700479865074158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,16,power_law_1.2,0.03720960021018982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,2,balanced,0.04597333570321401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,2,balanced,0.04816000163555145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,2,power_law_1.01,0.050470399856567386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,2,power_law_1.01,0.05113599896430969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,2,power_law_1.2,0.04818559885025024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,2,power_law_1.2,0.04917120039463043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,32,balanced,0.035887998839219414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,32,balanced,0.035904000202814736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,32,power_law_1.01,0.035743999481201175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,32,power_law_1.01,0.036236798763275145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,32,power_law_1.2,0.03591679930686951
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,32,power_law_1.2,0.03594880104064942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,4,balanced,0.03953066716591517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,4,balanced,0.04167466859022776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,4,power_law_1.01,0.046163201332092285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,4,power_law_1.01,0.04665600061416626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,4,power_law_1.2,0.045311999320983884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,4,power_law_1.2,0.045638400316238406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,64,balanced,0.03542399903138479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,64,balanced,0.03572266548871994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,64,power_law_1.01,0.034860798716545106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,64,power_law_1.01,0.03526400029659271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,64,power_law_1.2,0.03546879887580871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,64,power_law_1.2,0.03597440123558045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,8,balanced,0.03735466549793879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,8,balanced,0.03737599899371465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,8,power_law_1.01,0.04085119962692261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,8,power_law_1.01,0.04330880045890808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,8,power_law_1.2,0.04073599874973297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,1,8,power_law_1.2,0.0429504007101059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,2,1,balanced,0.0391839991013209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,2,1,balanced,0.039493332306543984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,2,1,power_law_1.01,0.04028159976005554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,2,1,power_law_1.01,0.04081920087337494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,2,1,power_law_1.2,0.04000000059604645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,2048,768,8,128,2,1,power_law_1.2,0.040115201473236085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,1,balanced,0.11691199739774068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,1,balanced,0.1179146667321523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,1,power_law_1.01,0.11308799982070923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,1,power_law_1.01,0.11414400339126587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,1,power_law_1.2,0.1126207947731018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,1,power_law_1.2,0.11342719793319703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,128,balanced,0.04200533529122671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,128,balanced,0.04371733466784159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,128,power_law_1.01,0.04105600118637085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,128,power_law_1.01,0.04268159866333008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,128,power_law_1.2,0.041510400176048276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,128,power_law_1.2,0.042105600237846375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,16,balanced,0.043738668163617454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,16,balanced,0.04428799947102865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,16,power_law_1.01,0.07528960108757018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,16,power_law_1.01,0.07552639842033386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,16,power_law_1.2,0.06712960004806519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,16,power_law_1.2,0.07212160229682922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,2,balanced,0.07592533528804779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,2,balanced,0.07820266485214233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,2,power_law_1.01,0.09056000113487243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,2,power_law_1.01,0.10687999725341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,2,power_law_1.2,0.08364800214767457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,2,power_law_1.2,0.09552639722824097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,256,balanced,0.04182933270931244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,256,balanced,0.04386133452256521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,256,power_law_1.01,0.041945600509643556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,256,power_law_1.01,0.04257279932498932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,256,power_law_1.2,0.04221439957618713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,256,power_law_1.2,0.04238080084323883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,32,balanced,0.043653334180514015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,32,balanced,0.04387199878692627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,32,power_law_1.01,0.057631999254226685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,32,power_law_1.01,0.05888640284538269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,32,power_law_1.2,0.058790397644042966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,32,power_law_1.2,0.0590399980545044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,4,balanced,0.059989333152770996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,4,balanced,0.0613973339398702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,4,power_law_1.01,0.08758400082588196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,4,power_law_1.01,0.08926079869270324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,4,power_law_1.2,0.07608960270881653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,4,power_law_1.2,0.07783039808273315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,64,balanced,0.043925335009892784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,64,balanced,0.043951998154322304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,64,power_law_1.01,0.04260480105876922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,64,power_law_1.01,0.04565759897232056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,64,power_law_1.2,0.04417920112609863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,64,power_law_1.2,0.04442879855632782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,8,balanced,0.050000001986821495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,8,balanced,0.052416001756985985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,8,power_law_1.01,0.08314239978790283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,8,power_law_1.01,0.08993279933929443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,8,power_law_1.2,0.06863359808921814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,1,8,power_law_1.2,0.07182719707489013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,2,1,balanced,0.06851199766000111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,2,1,balanced,0.06863466898600261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,2,1,power_law_1.01,0.06859520077705383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,2,1,power_law_1.01,0.06866559982299805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,2,1,power_law_1.2,0.0685375988483429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,2,1,power_law_1.2,0.06870399713516236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,4,1,balanced,0.05230399966239929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,4,1,balanced,0.05455466608206431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,4,1,power_law_1.01,0.05334399938583374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,4,1,power_law_1.01,0.05340800285339355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,4,1,power_law_1.2,0.053465598821640016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,3072,1536,8,256,4,1,power_law_1.2,0.053855997323989865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,1,balanced,0.28196267286936444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,1,balanced,0.2834560076395671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,1,power_law_1.01,0.19290879964828492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,1,power_law_1.01,0.21957759857177733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,1,power_law_1.2,0.18778239488601683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,1,power_law_1.2,0.19980159997940064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,2,balanced,0.1994346578915914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,2,balanced,0.2012373407681783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,2,power_law_1.01,0.1587648034095764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,2,power_law_1.01,0.17288960218429567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,2,power_law_1.2,0.15292799472808838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,2,power_law_1.2,0.16610560417175294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,4,balanced,0.1441439986228943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,4,balanced,0.14920533696810404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,4,power_law_1.01,0.13018879890441895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,4,power_law_1.01,0.1335360050201416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,4,power_law_1.2,0.1449280023574829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,4,power_law_1.2,0.1652992010116577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,8,balanced,0.1274720033009847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,8,balanced,0.12774933377901712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,8,power_law_1.01,0.12649600505828856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,8,power_law_1.01,0.12679680585861205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,8,power_law_1.2,0.1268671989440918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,1,8,power_law_1.2,0.1281280040740967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,16,1,balanced,0.049584001302719116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,16,1,balanced,0.05189333359400431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,16,1,power_law_1.01,0.0471231997013092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,16,1,power_law_1.01,0.047328001260757445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,16,1,power_law_1.2,0.04597119987010956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,16,1,power_law_1.2,0.0487744003534317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,2,1,balanced,0.15968533356984457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,2,1,balanced,0.16037866473197937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,2,1,power_law_1.01,0.10755840539932252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,2,1,power_law_1.01,0.11472640037536622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,2,1,power_law_1.2,0.10723199844360351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,2,1,power_law_1.2,0.11295360326766968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,4,1,balanced,0.09662399689356486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,4,1,balanced,0.10017599662144978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,4,1,power_law_1.01,0.07671040296554565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,4,1,power_law_1.01,0.08429440259933471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,4,1,power_law_1.2,0.07498239874839782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,4,1,power_law_1.2,0.07504640221595764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,8,1,balanced,0.06392533580462138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,8,1,balanced,0.06563200056552887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,8,1,power_law_1.01,0.053337597846984865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,8,1,power_law_1.01,0.05431039929389954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,8,1,power_law_1.2,0.057657599449157715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,14336,2,8,8,1,power_law_1.2,0.05863040089607239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,1,balanced,0.14289599657058716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,1,balanced,0.14364266395568848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,1,power_law_1.01,0.14238719940185546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,1,power_law_1.01,0.1429695963859558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,1,power_law_1.2,0.13319679498672485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,1,power_law_1.2,0.13911039829254152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,128,balanced,0.0460746685663859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,128,balanced,0.046165332198143005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,128,power_law_1.01,0.04467839896678925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,128,power_law_1.01,0.04469119906425476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,128,power_law_1.2,0.044614401459693906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,128,power_law_1.2,0.046163201332092285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,16,balanced,0.047600001096725464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,16,balanced,0.04809600114822388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,16,power_law_1.01,0.06590719819068909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,16,power_law_1.01,0.06787840127944947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,16,power_law_1.2,0.0658240020275116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,16,power_law_1.2,0.06666880249977111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,2,balanced,0.08832533160845439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,2,balanced,0.08884800473848979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,2,power_law_1.01,0.10030080080032348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,2,power_law_1.01,0.10140800476074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,2,power_law_1.2,0.09535359740257263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,2,power_law_1.2,0.09616000056266785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,32,balanced,0.04568000137805939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,32,balanced,0.0459146648645401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,32,power_law_1.01,0.04986880123615265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,32,power_law_1.01,0.0543615996837616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,32,power_law_1.2,0.05030400156974792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,32,power_law_1.2,0.05511040091514587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,4,balanced,0.06877866884072621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,4,balanced,0.06961599985758464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,4,power_law_1.01,0.0794048011302948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,4,power_law_1.01,0.08325120210647582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,4,power_law_1.2,0.07743359804153442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,4,power_law_1.2,0.08335999846458435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,64,balanced,0.045781334241231285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,64,balanced,0.04766400158405304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,64,power_law_1.01,0.045203199982643126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,64,power_law_1.01,0.04565120041370392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,64,power_law_1.2,0.04527359902858734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,64,power_law_1.2,0.045407998561859134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,8,balanced,0.05594133337338766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,8,balanced,0.05876266459623972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,8,power_law_1.01,0.07514879703521729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,8,power_law_1.01,0.07634559869766236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,8,power_law_1.2,0.06995199918746949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,1,8,power_law_1.2,0.07196800112724304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,2,1,balanced,0.08115200201670329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,2,1,balanced,0.08155733346939087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,2,1,power_law_1.01,0.07916160225868225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,2,1,power_law_1.01,0.07919359803199769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,2,1,power_law_1.2,0.07705600261688232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,2,1,power_law_1.2,0.07930240035057068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,4,1,balanced,0.0625546673933665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,4,1,balanced,0.06372799972693126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,4,1,power_law_1.01,0.06021760106086731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,4,1,power_law_1.01,0.06034560203552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,4,1,power_law_1.2,0.05991680026054382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,1536,8,128,4,1,power_law_1.2,0.060102397203445436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,1,balanced,0.49582401911417645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,1,balanced,0.49963200092315674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,1,power_law_1.01,0.49672961235046387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,1,power_law_1.01,0.4995264053344727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,1,power_law_1.2,0.4969600200653076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,1,power_law_1.2,0.4990528106689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,128,balanced,0.052298665046691895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,128,balanced,0.05416533350944519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,128,power_law_1.01,0.07249280214309692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,128,power_law_1.01,0.0725055992603302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,128,power_law_1.2,0.0723583996295929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,128,power_law_1.2,0.07271040081977845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,16,balanced,0.08983467022577922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,16,balanced,0.08994666735331218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,16,power_law_1.01,0.2041088104248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,16,power_law_1.01,0.2212991952896118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,16,power_law_1.2,0.21668479442596436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,16,power_law_1.2,0.22200961112976075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,2,balanced,0.293232003847758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,2,balanced,0.2936319907506307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,2,power_law_1.01,0.35971200466156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,2,power_law_1.01,0.3603327989578247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,2,power_law_1.2,0.3504960060119629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,2,power_law_1.2,0.3708992004394531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,256,balanced,0.05406400064627329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,256,power_law_1.01,0.05467519760131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,256,power_law_1.01,0.05824000239372253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,256,power_law_1.2,0.05867519974708557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,256,power_law_1.2,0.05978879928588867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,32,balanced,0.07786133388678233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,32,balanced,0.07861333092053731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,32,power_law_1.01,0.13868160247802735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,32,power_law_1.01,0.13915519714355468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,32,power_law_1.2,0.13819520473480223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,32,power_law_1.2,0.1392192006111145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,4,balanced,0.17706666390101114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,4,balanced,0.17748800913492838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,4,power_law_1.01,0.2902719974517822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,4,power_law_1.01,0.29323520660400393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,4,power_law_1.2,0.28460159301757815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,4,power_law_1.2,0.2937855958938599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,64,balanced,0.07036266724268596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,64,balanced,0.07041599849859874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,64,power_law_1.01,0.08609279990196228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,64,power_law_1.01,0.08798720240592957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,64,power_law_1.2,0.08602880239486695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,64,power_law_1.2,0.0870848000049591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,8,balanced,0.11148800452550252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,8,balanced,0.11183999975522359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,8,power_law_1.01,0.2405440092086792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,8,power_law_1.01,0.26150400638580323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,8,power_law_1.2,0.23484160900115966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,4096,2688,22,512,1,8,power_law_1.2,0.23767681121826173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,1,balanced,0.4443039894104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,1,balanced,0.44706666469573975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,1,power_law_1.01,0.2907711982727051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,1,power_law_1.01,0.2977407932281494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,1,power_law_1.2,0.305676794052124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,1,power_law_1.2,0.3138240098953247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,2,balanced,0.2900373339653015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,2,balanced,0.30032533407211304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,2,power_law_1.01,0.23522560596466063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,2,power_law_1.01,0.2888704061508179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,2,power_law_1.2,0.19237120151519777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,2,power_law_1.2,0.19966720342636107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,4,balanced,0.1859040061632792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,4,balanced,0.18784000476201376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,4,power_law_1.01,0.1642624020576477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,4,power_law_1.01,0.17895040512084961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,4,power_law_1.2,0.16223360300064088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,4,power_law_1.2,0.1688704013824463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,8,balanced,0.15863466262817383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,8,balanced,0.15908799568812051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,8,power_law_1.01,0.15641599893569946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,8,power_law_1.01,0.15696640014648439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,8,power_law_1.2,0.157151997089386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,1,8,power_law_1.2,0.177510404586792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,16,1,balanced,0.06599466502666473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,16,1,balanced,0.06758399804433186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,16,1,power_law_1.01,0.06110720038414001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,16,1,power_law_1.01,0.06142079830169678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,16,1,power_law_1.2,0.0605184018611908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,16,1,power_law_1.2,0.06113280057907104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,2,1,balanced,0.2353973388671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,2,1,balanced,0.2364693284034729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,2,1,power_law_1.01,0.15201280117034913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,2,1,power_law_1.01,0.16698240041732787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,2,1,power_law_1.2,0.16631679534912108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,2,1,power_law_1.2,0.16872960329055786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,32,1,balanced,0.0551146666208903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,32,1,balanced,0.056362668673197426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,32,1,power_law_1.01,0.051097601652145386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,32,1,power_law_1.01,0.051667201519012454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,32,1,power_law_1.2,0.04930559992790222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,32,1,power_law_1.2,0.051635199785232545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,4,1,balanced,0.13242133458455405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,4,1,balanced,0.1607146660486857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,4,1,power_law_1.01,0.09701120257377624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,4,1,power_law_1.01,0.10034559965133667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,4,1,power_law_1.2,0.09612799882888794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,4,1,power_law_1.2,0.10126719474792481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,8,1,balanced,0.09266666571299235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,8,1,balanced,0.09277866284052531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,8,1,power_law_1.01,0.07728639841079712
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,8,1,power_law_1.01,0.08103039860725403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,8,1,power_law_1.2,0.07036799788475037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,16384,2,8,8,1,power_law_1.2,0.07297919988632202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,1,balanced,0.23112533489863077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,1,balanced,0.23430933554967245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,1,power_law_1.01,0.23100800514221193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,1,power_law_1.01,0.2318592071533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,1,power_law_1.2,0.2300800085067749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,1,power_law_1.2,0.23162240982055665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,128,balanced,0.05605333546797434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,128,balanced,0.05606399973233541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,128,power_law_1.01,0.06023039817810059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,128,power_law_1.01,0.06633599996566772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,128,power_law_1.2,0.05859839916229248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,128,power_law_1.2,0.06222720146179199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,16,balanced,0.06257600088914235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,16,balanced,0.06403733293215434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,16,power_law_1.01,0.13986560106277465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,16,power_law_1.01,0.1406399965286255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,16,power_law_1.2,0.13066879510879517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,16,power_law_1.2,0.13110400438308717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,2,balanced,0.14256532986958823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,2,balanced,0.1455680032571157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,2,power_law_1.01,0.2059391975402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,2,power_law_1.01,0.21556479930877687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,2,power_law_1.2,0.18883199691772462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,2,power_law_1.2,0.19990400075912476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,256,balanced,0.05597866574923197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,256,balanced,0.05598400036493937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,256,power_law_1.01,0.05408639907836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,256,power_law_1.01,0.054790401458740236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,256,power_law_1.2,0.05372160077095032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,256,power_law_1.2,0.056403201818466184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,32,balanced,0.055946667989095054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,32,balanced,0.05628266433874766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,32,power_law_1.01,0.09571200013160705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,32,power_law_1.01,0.09738879799842834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,32,power_law_1.2,0.09496960043907166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,32,power_law_1.2,0.09612159729003907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,4,balanced,0.09902399778366089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,4,balanced,0.09954133629798889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,4,power_law_1.01,0.18509440422058104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,4,power_law_1.01,0.19375360012054443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,4,power_law_1.2,0.163481605052948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,4,power_law_1.2,0.1703935980796814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,64,balanced,0.055999999245007835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,64,balanced,0.056101332108179726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,64,power_law_1.01,0.07734400033950806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,64,power_law_1.01,0.07748479843139648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,64,power_law_1.2,0.07804800271987915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,64,power_law_1.2,0.0788096010684967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,8,balanced,0.07657599945863088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,8,balanced,0.07732800145943959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,8,power_law_1.01,0.1682368040084839
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,8,power_law_1.01,0.1834879994392395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,8,power_law_1.2,0.1369920015335083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,1,8,power_law_1.2,0.15421439409255983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,16,1,balanced,0.05996799965699514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,16,1,balanced,0.060191998879114784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,16,1,power_law_1.01,0.060121601819992064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,16,1,power_law_1.01,0.060812801122665405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,16,1,power_law_1.2,0.06050559878349304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,16,1,power_law_1.2,0.060684800148010254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,2,1,balanced,0.13221333424250284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,2,1,balanced,0.13326932986577353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,2,1,power_law_1.01,0.13052799701690673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,2,1,power_law_1.01,0.13119360208511352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,2,1,power_law_1.2,0.12999680042266845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,2,1,power_law_1.2,0.13078399896621704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,4,1,balanced,0.08816533287366231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,4,1,balanced,0.08879466851552327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,4,1,power_law_1.01,0.08709120154380798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,4,1,power_law_1.01,0.08817279934883118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,4,1,power_law_1.2,0.08759040236473084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,4,1,power_law_1.2,0.08796799778938294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,8,1,balanced,0.07649600009123485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,8,1,balanced,0.0782293329636256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,8,1,power_law_1.01,0.07624959945678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,8,1,power_law_1.01,0.07705600261688232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,8,1,power_law_1.2,0.07649919986724854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2048,8,256,8,1,power_law_1.2,0.07669119834899903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,1,balanced,0.29741867383321124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,1,balanced,0.2976693312327067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,1,power_law_1.01,0.2940671920776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,1,power_law_1.01,0.2948863983154297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,1,power_law_1.2,0.29395840167999265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,1,power_law_1.2,0.29512319564819334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,16,balanced,0.07204266885916392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,16,balanced,0.07249066730340321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,16,power_law_1.01,0.11205120086669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,16,power_law_1.01,0.1160256028175354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,16,power_law_1.2,0.11611520051956177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,16,power_law_1.2,0.11801600456237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,2,balanced,0.18829333782196045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,2,balanced,0.19105066855748495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,2,power_law_1.01,0.20456960201263427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,2,power_law_1.01,0.20773119926452638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,2,power_law_1.2,0.21350400447845458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,2,power_law_1.2,0.21724801063537597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,32,balanced,0.058101331194241844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,32,balanced,0.05810666580994924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,32,power_law_1.01,0.08748800158500672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,32,power_law_1.01,0.08820480108261108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,32,power_law_1.2,0.08737919926643371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,32,power_law_1.2,0.088646399974823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,4,balanced,0.10603732864061992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,4,balanced,0.1074026624361674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,4,power_law_1.01,0.13627519607543945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,4,power_law_1.01,0.17299840450286866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,4,power_law_1.2,0.16338560581207276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,4,power_law_1.2,0.16535680294036864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,8,balanced,0.08750933408737183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,8,balanced,0.08768533666928609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,8,power_law_1.01,0.1386304020881653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,8,power_law_1.01,0.15890560150146485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,8,power_law_1.2,0.151910400390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,1,8,power_law_1.2,0.15859199762344361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,2,1,balanced,0.17864533265431723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,2,1,balanced,0.1787733236948649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,2,1,power_law_1.01,0.17566720247268677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,2,1,power_law_1.01,0.17681920528411865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,2,1,power_law_1.2,0.17396479845046997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,2,1,power_law_1.2,0.1774399995803833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,4,1,balanced,0.10087999701499939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,4,1,balanced,0.10090133547782898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,4,1,power_law_1.01,0.0985535979270935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,4,1,power_law_1.01,0.09878399968147278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,4,1,power_law_1.2,0.09674879908561707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,6144,2560,8,160,4,1,power_law_1.2,0.09832320213317872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,1,balanced,0.2658133308092753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,1,balanced,0.26709334055582684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,1,power_law_1.01,0.2647104024887085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,1,power_law_1.01,0.26659839153289794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,1,power_law_1.2,0.2642751932144165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,1,power_law_1.2,0.26626560688018797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,128,balanced,0.058090666929880776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,128,balanced,0.05985599756240845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,128,power_law_1.01,0.07114880084991455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,128,power_law_1.01,0.07320320010185241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,128,power_law_1.2,0.07311360239982605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,128,power_law_1.2,0.07457919716835022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,16,balanced,0.07231999933719635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,16,balanced,0.0729066679875056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,16,power_law_1.01,0.156985604763031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,16,power_law_1.01,0.1573248028755188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,16,power_law_1.2,0.14344320297241211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,16,power_law_1.2,0.14747519493103028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,2,balanced,0.1585493286450704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,2,balanced,0.1609173317750295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,2,power_law_1.01,0.23260800838470458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,2,power_law_1.01,0.24298880100250245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,2,power_law_1.2,0.23454079627990723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,2,power_law_1.2,0.23827838897705078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,256,balanced,0.060122668743133545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,256,balanced,0.06190933287143707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,256,power_law_1.01,0.057580798864364624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,256,power_law_1.01,0.05899519920349121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,256,power_law_1.2,0.05877760052680969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,256,power_law_1.2,0.058899199962615965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,32,balanced,0.058186665177345276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,32,balanced,0.060090666015942894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,32,power_law_1.01,0.1051967978477478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,32,power_law_1.01,0.10537600517272949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,32,power_law_1.2,0.10483839511871337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,32,power_law_1.2,0.10545920133590699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,4,balanced,0.10920000076293945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,4,balanced,0.10929066936175029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,4,power_law_1.01,0.20019199848175048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,4,power_law_1.01,0.22547199726104736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,4,power_law_1.2,0.1683519959449768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,4,power_law_1.2,0.18026880025863648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,64,balanced,0.0612960010766983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,64,balanced,0.06198933223883311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,64,power_law_1.01,0.08407679796218873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,64,power_law_1.01,0.08426880240440368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,64,power_law_1.2,0.08410239815711976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,64,power_law_1.2,0.08535040020942689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,8,balanced,0.08117333551247914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,8,balanced,0.084389328956604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,8,power_law_1.01,0.19457919597625734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,8,power_law_1.01,0.2039936065673828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,8,power_law_1.2,0.17655680179595948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,1,8,power_law_1.2,0.17990399599075318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,16,1,balanced,0.06825600067774455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,16,1,balanced,0.06851733227570851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,16,1,power_law_1.01,0.06791039705276489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,16,1,power_law_1.01,0.0683135986328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,16,1,power_law_1.2,0.06836479902267456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,16,1,power_law_1.2,0.06840959787368775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,2,1,balanced,0.14732799927393594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,2,1,balanced,0.1479680041472117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,2,1,power_law_1.01,0.14646400213241578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,2,1,power_law_1.01,0.14702080488204955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,2,1,power_law_1.2,0.14594559669494628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,2,1,power_law_1.2,0.14709119796752929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,4,1,balanced,0.09851200381914775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,4,1,balanced,0.09878399968147278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,4,1,power_law_1.01,0.0969215989112854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,4,1,power_law_1.01,0.0976960003376007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,4,1,power_law_1.2,0.09711359739303589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,4,1,power_law_1.2,0.09747840166091919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,8,1,balanced,0.08660800258318584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,8,1,balanced,0.08666132887204488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,8,1,power_law_1.01,0.085971200466156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,8,1,power_law_1.01,0.0861631989479065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,8,1,power_law_1.2,0.08486400246620178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,256,8,1,power_law_1.2,0.08496000170707703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,1,balanced,0.26553599039713544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,1,balanced,0.27089067300160724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,1,power_law_1.01,0.2640320062637329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,1,power_law_1.01,0.2650048017501831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,1,power_law_1.2,0.26414079666137696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,1,power_law_1.2,0.26540799140930177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,128,balanced,0.05807999769846598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,128,balanced,0.06004266440868378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,128,power_law_1.01,0.07895680069923401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,128,power_law_1.01,0.07909119725227357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,128,power_law_1.2,0.07870720028877258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,128,power_law_1.2,0.07984640002250672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,16,balanced,0.07138133545716603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,16,balanced,0.07625600198904674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,16,power_law_1.01,0.23255679607391358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,16,power_law_1.01,0.24087040424346923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,16,power_law_1.2,0.22831358909606933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,16,power_law_1.2,0.2307391881942749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,2,balanced,0.15607466300328574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,2,balanced,0.1561973293622335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,2,power_law_1.01,0.2736255884170532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,2,power_law_1.01,0.27596158981323243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,2,power_law_1.2,0.24869120121002197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,2,power_law_1.2,0.2492608070373535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,32,balanced,0.05997333427270254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,32,balanced,0.0641546646753947
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,32,power_law_1.01,0.13595520257949828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,32,power_law_1.01,0.13648639917373656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,32,power_law_1.2,0.13473279476165773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,32,power_law_1.2,0.13583999872207642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,4,balanced,0.10703466335932414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,4,balanced,0.109333336353302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,4,power_law_1.01,0.2676480054855347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,4,power_law_1.01,0.2728384017944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,4,power_law_1.2,0.23074560165405272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,4,power_law_1.2,0.24050559997558593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,64,balanced,0.060175999999046326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,64,balanced,0.062224000692367554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,64,power_law_1.01,0.09244800209999085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,64,power_law_1.01,0.09247360229492188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,64,power_law_1.2,0.09184640049934387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,64,power_law_1.2,0.09253759980201721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,8,balanced,0.08650133013725281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,8,balanced,0.08683733145395915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,8,power_law_1.01,0.2716032028198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,8,power_law_1.01,0.2739903926849365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,8,power_law_1.2,0.22815361022949218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,1,8,power_law_1.2,0.2332672119140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,16,1,balanced,0.06205333272616068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,16,1,balanced,0.06362666686375935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,16,1,power_law_1.01,0.060652798414230345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,16,1,power_law_1.01,0.0617792010307312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,16,1,power_law_1.2,0.06202239990234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,16,1,power_law_1.2,0.06221439838409424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,2,1,balanced,0.14803199966748556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,2,1,balanced,0.1481226682662964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,2,1,power_law_1.01,0.14652160406112671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,2,1,power_law_1.01,0.14670720100402831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,2,1,power_law_1.2,0.14561280012130737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,2,1,power_law_1.2,0.1459391951560974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,4,1,balanced,0.09724799791971843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,4,1,balanced,0.09865599870681763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,4,1,power_law_1.01,0.09662079811096191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,4,1,power_law_1.01,0.09712640047073365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,4,1,power_law_1.2,0.09755520224571228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,4,1,power_law_1.2,0.09797120094299316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,8,1,balanced,0.07276799778143565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,8,1,balanced,0.07285333176453908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,8,1,power_law_1.01,0.0707647979259491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,8,1,power_law_1.01,0.07151359915733338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,8,1,power_law_1.2,0.07081599831581116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4,7168,2048,8,384,8,1,power_law_1.2,0.07123839855194092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,1,balanced,0.8871466318766276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,1,balanced,0.8880266348520914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,1,power_law_1.01,0.9339903831481934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,1,power_law_1.01,0.9359231948852539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,1,power_law_1.2,0.9345855712890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,1,power_law_1.2,0.9369791984558106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,128,balanced,0.3373333215713501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,128,balanced,0.33852267265319824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,128,power_law_1.01,0.36488320827484133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,128,power_law_1.01,0.36659200191497804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,128,power_law_1.2,0.39779200553894045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,128,power_law_1.2,0.39882240295410154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,16,balanced,0.37040531635284424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,16,balanced,0.37071998914082843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,16,power_law_1.01,0.4175680160522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,16,power_law_1.01,0.4188096046447754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,16,power_law_1.2,0.43029122352600097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,16,power_law_1.2,0.43125119209289553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,2,balanced,0.6396053234736124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,2,balanced,0.6424746513366699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,2,power_law_1.01,0.6966271877288819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,2,power_law_1.01,0.7024256229400635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,2,power_law_1.2,0.7263167858123779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,2,power_law_1.2,0.7372928142547608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,32,balanced,0.35149868329366046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,32,balanced,0.351583997408549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,32,power_law_1.01,0.39017601013183595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,32,power_law_1.01,0.3944511890411377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,32,power_law_1.2,0.40787200927734374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,32,power_law_1.2,0.41528959274291993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,4,balanced,0.4883413314819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,4,balanced,0.48934932549794513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,4,power_law_1.01,0.5431551933288574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,4,power_law_1.01,0.5550911903381348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,4,power_law_1.2,0.5556608200073242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,4,power_law_1.2,0.5695744037628174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,64,balanced,0.3407786687215169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,64,balanced,0.34325865904490155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,64,power_law_1.01,0.37452800273895265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,64,power_law_1.01,0.38754560947418215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,64,power_law_1.2,0.398144006729126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,64,power_law_1.2,0.408787202835083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,8,balanced,0.4096533457438151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,8,balanced,0.4102453390757243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,8,power_law_1.01,0.46588802337646484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,8,power_law_1.01,0.4778304100036621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,8,power_law_1.2,0.4847616195678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,1,8,power_law_1.2,0.4850048065185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,2,1,balanced,0.5506986776987711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,2,1,balanced,0.5509119828542074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,2,1,power_law_1.01,0.5828224182128906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,2,1,power_law_1.01,0.5868224143981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,2,1,power_law_1.2,0.584659194946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,2048,768,8,128,2,1,power_law_1.2,0.5856256008148193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,1,balanced,2.273578643798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,1,balanced,2.274639924367269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,1,power_law_1.01,2.7533248901367187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,1,power_law_1.01,2.7536832809448244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,1,power_law_1.2,2.7878976821899415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,1,power_law_1.2,2.7957952499389647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,128,balanced,0.5671519835789999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,128,balanced,0.5684266487757365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,128,power_law_1.01,0.632755184173584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,128,power_law_1.01,0.6336128234863281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,128,power_law_1.2,0.6685823917388916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,128,power_law_1.2,0.6833343982696534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,16,balanced,0.6674346923828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,16,balanced,0.6682773431142172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,16,power_law_1.01,0.7801919937133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,16,power_law_1.01,0.7863359928131104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,16,power_law_1.2,0.8080448150634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,16,power_law_1.2,0.8137984275817871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,2,balanced,1.4484532674153645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,2,balanced,1.4503733317057292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,2,power_law_1.01,1.7256895065307618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,2,power_law_1.01,1.800454330444336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,2,power_law_1.2,1.7940992355346679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,2,power_law_1.2,1.866156768798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,256,balanced,0.5622826814651489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,256,balanced,0.562602678934733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,256,power_law_1.01,0.6056640148162842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,256,power_law_1.01,0.6062975883483886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,256,power_law_1.2,0.6463295936584472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,256,power_law_1.2,0.6500351905822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,32,balanced,0.6096906661987305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,32,balanced,0.6109919945398966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,32,power_law_1.01,0.7081920146942139
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,32,power_law_1.01,0.7175551891326905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,32,power_law_1.2,0.7240831851959229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,32,power_law_1.2,0.7402175903320313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,4,balanced,1.0049013296763103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,4,balanced,1.0054879983266194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,4,power_law_1.01,1.207545566558838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,4,power_law_1.01,1.2153471946716308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,4,power_law_1.2,1.2477503776550294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,4,power_law_1.2,1.2789183616638184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,64,balanced,0.5806560118993124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,64,balanced,0.5825706720352173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,64,power_law_1.01,0.654150390625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,64,power_law_1.01,0.660972785949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,64,power_law_1.2,0.6762176036834717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,64,power_law_1.2,0.6854464054107666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,8,balanced,0.7832852999369303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,8,balanced,0.7847306728363037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,8,power_law_1.01,0.9297408103942871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,8,power_law_1.01,0.9393024444580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,8,power_law_1.2,0.9783167839050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,1,8,power_law_1.2,1.0006143569946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,2,1,balanced,1.3089599609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,2,1,balanced,1.3090506394704182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,2,1,power_law_1.01,1.54835844039917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,2,1,power_law_1.01,1.5487872123718263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,2,1,power_law_1.2,1.570201587677002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,2,1,power_law_1.2,1.5843328475952148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,4,1,balanced,0.8166933059692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,4,1,balanced,0.8171892960866293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,4,1,power_law_1.01,0.9467071533203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,4,1,power_law_1.01,0.9478591918945313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,4,1,power_law_1.2,0.9596480369567871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,3072,1536,8,256,4,1,power_law_1.2,0.9636351585388183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,1,balanced,5.528645197550456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,1,balanced,5.531781514485677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,1,power_law_1.01,5.683660888671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,1,power_law_1.01,5.700236892700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,1,power_law_1.2,5.689164733886718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,1,power_law_1.2,5.692262268066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,2,balanced,3.185647964477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,2,balanced,3.1906185150146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,2,power_law_1.01,3.9792831420898436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,2,power_law_1.01,4.552422332763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,2,power_law_1.2,3.7903297424316404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,2,power_law_1.2,4.385555267333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,4,balanced,2.057466665903727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,4,balanced,2.059903939565023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,4,power_law_1.01,3.1603200912475584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,4,power_law_1.01,3.218431854248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,4,power_law_1.2,3.271744155883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,4,power_law_1.2,3.4047168731689452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,8,balanced,1.4387946128845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,8,balanced,1.44158935546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,8,power_law_1.01,2.9117504119873048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,8,power_law_1.01,2.9614015579223634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,8,power_law_1.2,2.973324775695801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,1,8,power_law_1.2,3.012563133239746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,16,1,balanced,0.481386661529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,16,1,balanced,0.4829973379770915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,16,1,power_law_1.01,0.47737598419189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,16,1,power_law_1.01,0.483571195602417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,16,1,power_law_1.2,0.4798912048339844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,16,1,power_law_1.2,0.4799168109893799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,2,1,balanced,2.795584042867025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,2,1,balanced,2.7983999252319336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,2,1,power_law_1.01,2.8354944229125976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,2,1,power_law_1.01,2.8500415802001955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,2,1,power_law_1.2,2.841958427429199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,2,1,power_law_1.2,2.842848014831543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,4,1,balanced,1.469930648803711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,4,1,balanced,1.4706346193949382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,4,1,power_law_1.01,1.4772992134094238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,4,1,power_law_1.01,1.4907967567443847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,4,1,power_law_1.2,1.4770943641662597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,4,1,power_law_1.2,1.4887104034423828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,8,1,balanced,0.8103626569112142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,8,1,balanced,0.8128426869710287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,8,1,power_law_1.01,0.8044544219970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,8,1,power_law_1.01,0.8141951560974121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,8,1,power_law_1.2,0.7991040229797364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,14336,2,8,8,1,power_law_1.2,0.8030719757080078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,1,balanced,2.751615842183431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,1,balanced,2.755610783894857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,1,power_law_1.01,3.0247039794921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,1,power_law_1.01,3.0410943984985352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,1,power_law_1.2,3.0198272705078124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,1,power_law_1.2,3.023539161682129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,128,balanced,0.6071093479792277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,128,balanced,0.6085919936498007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,128,power_law_1.01,0.7181119918823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,128,power_law_1.01,0.7320256233215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,128,power_law_1.2,0.8184320449829101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,128,power_law_1.2,0.8232255935668945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,16,balanced,0.7315786679585775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,16,balanced,0.7320426305135092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,16,power_law_1.01,0.8963135719299317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,16,power_law_1.01,0.9327743530273438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,16,power_law_1.2,0.929043197631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,16,power_law_1.2,1.0183103561401368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,2,balanced,1.7170987129211426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,2,balanced,1.7184373537699382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,2,power_law_1.01,2.022694396972656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,2,power_law_1.01,2.0369216918945314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,2,power_law_1.2,1.9666879653930665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,2,power_law_1.2,1.9891584396362305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,32,balanced,0.6595199902852377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,32,balanced,0.6625386476516724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,32,power_law_1.01,0.810035228729248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,32,power_law_1.01,0.8262784004211425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,32,power_law_1.2,0.8839232444763183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,32,power_law_1.2,0.8917183876037598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,4,balanced,1.15720534324646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,4,balanced,1.1587680180867512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,4,power_law_1.01,1.3494015693664552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,4,power_law_1.01,1.3731328010559083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,4,power_law_1.2,1.3904319763183595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,4,power_law_1.2,1.4299200057983399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,64,balanced,0.6253066857655843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,64,balanced,0.6260906855265299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,64,power_law_1.01,0.7578368186950684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,64,power_law_1.01,0.7615295886993408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,64,power_law_1.2,0.8116288185119629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,64,power_law_1.2,0.8354240417480469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,8,balanced,0.8776319821675619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,8,balanced,0.8785706361134847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,8,power_law_1.01,1.0615679740905761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,8,power_law_1.01,1.0948479652404786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,8,power_law_1.2,1.0835328102111816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,1,8,power_law_1.2,1.1789504051208497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,2,1,balanced,1.567072073618571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,2,1,balanced,1.5711520512898762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,2,1,power_law_1.01,1.6531391143798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,2,1,power_law_1.01,1.6531583786010742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,2,1,power_law_1.2,1.655583953857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,2,1,power_law_1.2,1.6557888031005858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,4,1,balanced,0.975221316019694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,4,1,balanced,0.9759946664174398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,4,1,power_law_1.01,1.0404224395751953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,4,1,power_law_1.01,1.0404416084289552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,4,1,power_law_1.2,1.041651153564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,1536,8,128,4,1,power_law_1.2,1.0441791534423828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,1,balanced,13.594144185384115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,1,balanced,13.595760345458984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,1,power_law_1.01,14.814656066894532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,1,power_law_1.01,14.843014526367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,1,power_law_1.2,14.952716064453124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,1,power_law_1.2,15.000364685058594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,128,balanced,2.264794667561849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,128,balanced,2.2663680712381997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,128,power_law_1.01,2.5111871719360352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,128,power_law_1.01,2.5231679916381835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,128,power_law_1.2,2.621075248718262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,128,power_law_1.2,2.636524772644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,16,balanced,2.9105494817097983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,16,balanced,2.915973345438639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,16,power_law_1.01,3.3021823883056642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,16,power_law_1.01,3.317900848388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,16,power_law_1.2,3.53125114440918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,16,power_law_1.2,3.588556671142578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,2,balanced,7.997999827067058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,2,balanced,7.998314539591472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,2,power_law_1.01,8.8797119140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,2,power_law_1.01,8.909939575195313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,2,power_law_1.2,9.073260498046874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,2,power_law_1.2,9.297811126708984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,256,balanced,2.219088077545166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,256,balanced,2.22763729095459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,256,power_law_1.01,2.407251167297363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,256,power_law_1.01,2.425836753845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,256,power_law_1.2,2.515072059631348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,256,power_law_1.2,2.599763107299805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,32,balanced,2.5429333051045737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,32,balanced,2.5429919560750327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,32,power_law_1.01,2.86812801361084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,32,power_law_1.01,2.89052791595459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,32,power_law_1.2,2.965100860595703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,32,power_law_1.2,3.0106239318847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,4,balanced,5.0929867426554365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,4,balanced,5.097802797953288
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,4,power_law_1.01,5.871775817871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,4,power_law_1.01,6.005215835571289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,4,power_law_1.2,5.905523300170898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,4,power_law_1.2,6.066873550415039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,64,balanced,2.357855955759684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,64,balanced,2.367311954498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,64,power_law_1.01,2.6268415451049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,64,power_law_1.01,2.646463966369629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,64,power_law_1.2,2.7815040588378905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,64,power_law_1.2,2.785152053833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,8,balanced,3.6452159881591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,8,balanced,3.653514544169108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,8,power_law_1.01,4.250112152099609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,8,power_law_1.01,4.262764739990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,8,power_law_1.2,4.333875274658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,4096,2688,22,512,1,8,power_law_1.2,4.49119987487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,1,balanced,8.923962910970053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,1,balanced,8.926767985026041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,1,power_law_1.01,9.147206115722657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,1,power_law_1.01,9.155039978027343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,1,power_law_1.2,9.137868499755859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,1,power_law_1.2,9.166598510742187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,2,balanced,5.016016006469727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,2,balanced,5.0188798904418945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,2,power_law_1.01,6.517497253417969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,2,power_law_1.01,7.75137939453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,2,power_law_1.2,6.948601531982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,2,power_law_1.2,7.296851348876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,4,balanced,3.0474398930867515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,4,balanced,3.0497919718424478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,4,power_law_1.01,4.960211181640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,4,power_law_1.01,5.72284164428711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,4,power_law_1.2,4.951200103759765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,4,power_law_1.2,5.399135971069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,8,balanced,1.996554692586263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,8,balanced,1.9970506032307942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,8,power_law_1.01,4.363558578491211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,8,power_law_1.01,4.75103988647461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,8,power_law_1.2,4.735340881347656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,1,8,power_law_1.2,4.855340957641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,16,1,balanced,0.7440053621927897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,16,1,balanced,0.7456746896107992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,16,1,power_law_1.01,0.7476096153259277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,16,1,power_law_1.01,0.7498239994049072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,16,1,power_law_1.2,0.7394559860229493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,16,1,power_law_1.2,0.7444672107696533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,2,1,balanced,4.527173360188802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,2,1,balanced,4.535189310709636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,2,1,power_law_1.01,4.586438369750977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,2,1,power_law_1.01,4.5984447479248045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,2,1,power_law_1.2,4.576480102539063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,2,1,power_law_1.2,4.608000183105469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,32,1,balanced,0.492847998936971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,32,1,balanced,0.4945760170618693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,32,1,power_law_1.01,0.4864384174346924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,32,1,power_law_1.01,0.48850560188293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,32,1,power_law_1.2,0.4791872024536133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,32,1,power_law_1.2,0.481657600402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,4,1,balanced,2.3769706090291343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,4,1,balanced,2.377509276072184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,4,1,power_law_1.01,2.4010047912597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,4,1,power_law_1.01,2.408684730529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,4,1,power_law_1.2,2.4006591796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,4,1,power_law_1.2,2.4015871047973634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,8,1,balanced,1.2865973313649495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,8,1,balanced,1.2893386681874592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,8,1,power_law_1.01,1.2960831642150878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,8,1,power_law_1.01,1.3003520011901855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,8,1,power_law_1.2,1.2888895988464355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,16384,2,8,8,1,power_law_1.2,1.2913663864135743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,1,balanced,5.321338653564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,1,balanced,5.322405179341634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,1,power_law_1.01,6.556755065917969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,1,power_law_1.01,6.586022186279297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,1,power_law_1.2,6.675328063964844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,1,power_law_1.2,6.724646759033203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,128,balanced,0.8965173562367758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,128,balanced,0.898149331410726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,128,power_law_1.01,1.0233216285705566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,128,power_law_1.01,1.0733183860778808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,128,power_law_1.2,1.1668031692504883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,128,power_law_1.2,1.1743167877197265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,16,balanced,1.1544426282246907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,16,balanced,1.1594399611155193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,16,power_law_1.01,1.4510272026062012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,16,power_law_1.01,1.477228832244873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,16,power_law_1.2,1.528812789916992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,16,power_law_1.2,1.6204479217529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,2,balanced,3.1556641260782876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,2,balanced,3.1585280100504556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,2,power_law_1.01,3.8214656829833986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,2,power_law_1.01,3.9974910736083986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,2,power_law_1.2,3.9892608642578127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,2,power_law_1.2,4.1424705505371096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,256,balanced,0.8817760149637858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,256,balanced,0.8831626574198405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,256,power_law_1.01,0.9940671920776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,256,power_law_1.01,1.0000063896179199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,256,power_law_1.2,1.093280029296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,256,power_law_1.2,1.0982080459594727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,32,balanced,1.008639971415202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,32,balanced,1.0093973477681477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,32,power_law_1.01,1.2273856163024903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,32,power_law_1.01,1.255033588409424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,32,power_law_1.2,1.3605119705200195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,32,power_law_1.2,1.3884287834167481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,4,balanced,2.018330732981364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,4,balanced,2.0209919611612954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,4,power_law_1.01,2.543737602233887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,4,power_law_1.01,2.5682239532470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,4,power_law_1.2,2.6248064041137695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,4,power_law_1.2,2.683078384399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,64,balanced,0.9360640048980713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,64,balanced,0.9374667008717855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,64,power_law_1.01,1.117568016052246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,64,power_law_1.01,1.1206080436706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,64,power_law_1.2,1.2589376449584961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,64,power_law_1.2,1.3411007881164552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,8,balanced,1.4051146507263184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,8,balanced,1.4053227106730144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,8,power_law_1.01,1.7978368759155274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,8,power_law_1.01,1.8456575393676757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,8,power_law_1.2,1.8512256622314454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,1,8,power_law_1.2,1.8666368484497071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,16,1,balanced,0.9258506298065186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,16,1,balanced,0.9274400075276693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,16,1,power_law_1.01,1.0429311752319337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,16,1,power_law_1.01,1.0484607696533204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,16,1,power_law_1.2,1.0523839950561524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,16,1,power_law_1.2,1.054361629486084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,2,1,balanced,2.9383519490559897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,2,1,balanced,2.9413601557413735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,2,1,power_law_1.01,3.595840072631836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,2,1,power_law_1.01,3.606156921386719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,2,1,power_law_1.2,3.6594879150390627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,2,1,power_law_1.2,3.6676990509033205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,4,1,balanced,1.7168854077657063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,4,1,balanced,1.7173760732014973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,4,1,power_law_1.01,2.058745574951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,4,1,power_law_1.01,2.06426887512207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,4,1,power_law_1.2,2.088159942626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,4,1,power_law_1.2,2.091596794128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,8,1,balanced,2.234517256418864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,8,1,balanced,2.23470401763916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,8,1,power_law_1.01,2.4885759353637695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,8,1,power_law_1.01,2.4899200439453124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,8,1,power_law_1.2,2.5950271606445314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2048,8,256,8,1,power_law_1.2,2.6050304412841796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,1,balanced,7.53927485148112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,1,balanced,7.557727813720703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,1,power_law_1.01,7.232749176025391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,1,power_law_1.01,7.261376190185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,1,power_law_1.2,7.257977294921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,1,power_law_1.2,7.292755126953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,16,balanced,1.3489333788553874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,16,balanced,1.3511734008789062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,16,power_law_1.01,1.591916847229004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,16,power_law_1.01,1.7276800155639649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,16,power_law_1.2,1.8887680053710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,16,power_law_1.2,1.944268798828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,2,balanced,4.290863990783691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,2,balanced,4.292069435119629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,2,power_law_1.01,4.515615844726563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,2,power_law_1.01,4.553478240966797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,2,power_law_1.2,4.4568126678466795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,2,power_law_1.2,4.596326446533203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,32,balanced,1.1331466833750408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,32,balanced,1.1332320372263591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,32,power_law_1.01,1.3885248184204102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,32,power_law_1.01,1.4822272300720214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,32,power_law_1.2,1.6883007049560548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,32,power_law_1.2,1.7444927215576171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,4,balanced,2.5338719685872397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,4,balanced,2.5351573626200357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,4,power_law_1.01,2.8236608505249023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,4,power_law_1.01,2.8671615600585936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,4,power_law_1.2,2.984294319152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,4,power_law_1.2,2.9850175857543944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,8,balanced,1.7353119850158691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,8,balanced,1.735322634379069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,8,power_law_1.01,1.9540224075317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,8,power_law_1.01,2.0473663330078127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,8,power_law_1.2,2.2393215179443358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,1,8,power_law_1.2,2.3648895263671874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,2,1,balanced,4.09060796101888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,2,1,balanced,4.091914812723796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,2,1,power_law_1.01,3.9111934661865235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,2,1,power_law_1.01,3.922681427001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,2,1,power_law_1.2,3.9191616058349608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,2,1,power_law_1.2,3.9431617736816404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,4,1,balanced,2.333343982696533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,4,1,balanced,2.334895928700765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,4,1,power_law_1.01,2.1856191635131834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,4,1,power_law_1.01,2.1993535995483398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,4,1,power_law_1.2,2.196748733520508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,6144,2560,8,160,4,1,power_law_1.2,2.2047231674194334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,1,balanced,6.126442591349284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,1,balanced,6.135274887084961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,1,power_law_1.01,7.557299041748047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,1,power_law_1.01,7.579283142089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,1,power_law_1.2,7.753254699707031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,1,power_law_1.2,7.807405090332031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,128,balanced,0.9705066680908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,128,balanced,0.9743093649546305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,128,power_law_1.01,1.1560383796691895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,128,power_law_1.01,1.1820480346679687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,128,power_law_1.2,1.2565631866455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,128,power_law_1.2,1.2833791732788087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,16,balanced,1.2749439875284831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,16,balanced,1.2768320242563884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,16,power_law_1.01,1.5780608177185058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,16,power_law_1.01,1.5833855628967286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,16,power_law_1.2,1.694905662536621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,16,power_law_1.2,1.7581184387207032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,2,balanced,3.611290613810221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,2,balanced,3.619050661722819
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,2,power_law_1.01,4.554764938354492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,2,power_law_1.01,4.6451904296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,2,power_law_1.2,4.539193725585937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,2,power_law_1.2,4.548262405395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,256,balanced,0.9528160095214844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,256,balanced,0.9545760154724121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,256,power_law_1.01,1.0880831718444823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,256,power_law_1.01,1.09869441986084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,256,power_law_1.2,1.2306303977966309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,256,power_law_1.2,1.246342372894287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,32,balanced,1.104698657989502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,32,balanced,1.1069546540578206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,32,power_law_1.01,1.3259263992309571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,32,power_law_1.01,1.3499903678894043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,32,power_law_1.2,1.4606080055236816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,32,power_law_1.2,1.4625791549682616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,4,balanced,2.279850641886393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,4,balanced,2.2830026944478354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,4,power_law_1.01,2.8952896118164064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,4,power_law_1.01,2.9860160827636717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,4,power_law_1.2,2.9759103775024416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,4,power_law_1.2,2.9785280227661133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,64,balanced,1.0171199639638264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,64,balanced,1.0195146401723225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,64,power_law_1.01,1.254047966003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,64,power_law_1.01,1.2679936408996582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,64,power_law_1.2,1.338163185119629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,64,power_law_1.2,1.3565759658813477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,8,balanced,1.557802677154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,8,balanced,1.5602025985717773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,8,power_law_1.01,1.9285184860229492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,8,power_law_1.01,2.068684768676758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,8,power_law_1.2,2.2088191986083983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,1,8,power_law_1.2,2.2425792694091795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,16,1,balanced,1.0698293050130208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,16,1,balanced,1.0698346296946208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,16,1,power_law_1.01,1.2073344230651855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,16,1,power_law_1.01,1.2111807823181153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,16,1,power_law_1.2,1.2137280464172364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,16,1,power_law_1.2,1.2139455795288085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,2,1,balanced,3.395770708719889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,2,1,balanced,3.401050567626953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,2,1,power_law_1.01,4.179155349731445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,2,1,power_law_1.01,4.179417419433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,2,1,power_law_1.2,4.236179351806641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,2,1,power_law_1.2,4.244627380371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,4,1,balanced,1.9647307395935059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,4,1,balanced,1.9654879570007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,4,1,power_law_1.01,2.3680511474609376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,4,1,power_law_1.01,2.3738943099975587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,4,1,power_law_1.2,2.4120000839233398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,4,1,power_law_1.2,2.420748710632324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,8,1,balanced,2.5907413164774575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,8,1,balanced,2.5911839803059897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,8,1,power_law_1.01,2.8978111267089846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,8,1,power_law_1.01,2.953683280944824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,8,1,power_law_1.2,3.0173887252807616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,256,8,1,power_law_1.2,3.0367679595947266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,1,balanced,8.762896219889322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,1,balanced,8.767274856567383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,1,power_law_1.01,8.542400360107422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,1,power_law_1.01,8.551289367675782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,1,power_law_1.2,8.854662322998047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,1,power_law_1.2,8.860102081298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,128,balanced,1.0494720141092937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,128,balanced,1.050821304321289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,128,power_law_1.01,1.1990592002868652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,128,power_law_1.01,1.2041919708251954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,128,power_law_1.2,1.2662079811096192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,128,power_law_1.2,1.2892416000366211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,16,balanced,1.4898026784261067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,16,balanced,1.4912959734598796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,16,power_law_1.01,1.6972032546997071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,16,power_law_1.01,1.7036096572875976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,16,power_law_1.2,1.7786687850952148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,16,power_law_1.2,1.8257152557373046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,2,balanced,4.937413215637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,2,balanced,4.938501358032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,2,power_law_1.01,5.044038391113281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,2,power_law_1.01,5.068838500976563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,2,power_law_1.2,5.180294418334961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,2,power_law_1.2,5.231980895996093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,32,balanced,1.2418346405029297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,32,balanced,1.2439893086751301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,32,power_law_1.01,1.4019647598266602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,32,power_law_1.01,1.4036224365234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,32,power_law_1.2,1.4922112464904784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,32,power_law_1.2,1.5031488418579102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,4,balanced,2.9702186584472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,4,balanced,2.975488026936849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,4,power_law_1.01,3.1793920516967775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,4,power_law_1.01,3.2159488677978514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,4,power_law_1.2,3.2551551818847657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,4,power_law_1.2,3.427827072143555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,64,balanced,1.1131306489308674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,64,balanced,1.1164320309956868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,64,power_law_1.01,1.2761152267456055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,64,power_law_1.01,1.3014335632324219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,64,power_law_1.2,1.3381183624267579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,64,power_law_1.2,1.3501248359680176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,8,balanced,1.9846080144246419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,8,balanced,1.984922726949056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,8,power_law_1.01,2.2058879852294924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,8,power_law_1.01,2.229727935791016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,8,power_law_1.2,2.245484733581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,1,8,power_law_1.2,2.3446847915649416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,16,1,balanced,1.2999040285746257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,16,1,balanced,1.30349866549174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,16,1,power_law_1.01,1.364863967895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,16,1,power_law_1.01,1.3663616180419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,16,1,power_law_1.2,1.3982784271240234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,16,1,power_law_1.2,1.4003968238830566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,2,1,balanced,4.753039995829265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,2,1,balanced,4.755578676859538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,2,1,power_law_1.01,4.655168151855468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,2,1,power_law_1.01,4.664883041381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,2,1,power_law_1.2,4.8499198913574215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,2,1,power_law_1.2,4.866617584228516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,4,1,balanced,2.784634590148926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,4,1,balanced,2.786410649617513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,4,1,power_law_1.01,2.7337472915649412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,4,1,power_law_1.01,2.75283203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,4,1,power_law_1.2,2.822707176208496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,4,1,power_law_1.2,2.8351295471191404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,8,1,balanced,1.801695982615153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,8,1,balanced,1.8048213322957356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,8,1,power_law_1.01,1.7686656951904296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,8,1,power_law_1.01,1.7730047225952148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,8,1,power_law_1.2,1.7977344512939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,4096,7168,2048,8,384,8,1,power_law_1.2,1.8162687301635743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,1,balanced,0.1409173309803009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,1,balanced,0.141866664091746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,1,power_law_1.01,0.12878079414367677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,1,power_law_1.01,0.12942080497741698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,1,power_law_1.2,0.13144960403442382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,1,power_law_1.2,0.1341375946998596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,128,balanced,0.03907199949026108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,128,balanced,0.0397173340121905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,128,power_law_1.01,0.03820799887180328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,128,power_law_1.01,0.03857280015945434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,128,power_law_1.2,0.03806079924106598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,128,power_law_1.2,0.03816959857940674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,16,balanced,0.04351999859015147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,16,balanced,0.04357333481311798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,16,power_law_1.01,0.04207360148429871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,16,power_law_1.01,0.04220159947872162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,16,power_law_1.2,0.04199039936065674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,16,power_law_1.2,0.042131200432777405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,2,balanced,0.0951039989789327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,2,balanced,0.09692266583442688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,2,power_law_1.01,0.08951039910316468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,2,power_law_1.01,0.09073920249938965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,2,power_law_1.2,0.08935040235519409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,2,power_law_1.2,0.09072639942169189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,32,balanced,0.0397119993964831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,32,balanced,0.03979733337958654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,32,power_law_1.01,0.038380798697471616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,32,power_law_1.01,0.03863680064678192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,32,power_law_1.2,0.03845120072364807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,32,power_law_1.2,0.03903999924659729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,4,balanced,0.063509335120519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,4,balanced,0.06413333117961884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,4,power_law_1.01,0.06035199761390686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,4,power_law_1.01,0.06105599999427795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,4,power_law_1.2,0.06094080209732056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,4,power_law_1.2,0.061862397193908694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,64,balanced,0.03976533313592275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,64,balanced,0.039808000127474465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,64,power_law_1.01,0.0377920001745224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,64,power_law_1.01,0.0384768009185791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,64,power_law_1.2,0.03834240138530731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,64,power_law_1.2,0.0385343998670578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,8,balanced,0.05603733162085215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,8,balanced,0.05643199880917867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,8,power_law_1.01,0.05187199711799621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,8,power_law_1.01,0.053497600555419925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,8,power_law_1.2,0.052070397138595584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,1,8,power_law_1.2,0.05374079942703247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,2,1,balanced,0.09779733419418335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,2,1,balanced,0.09849599997202556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,2,1,power_law_1.01,0.09027199745178223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,2,1,power_law_1.01,0.09072639942169189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,2,1,power_law_1.2,0.09086080193519593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,2048,768,8,128,2,1,power_law_1.2,0.0924351990222931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,1,balanced,0.6173439820607504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,1,balanced,0.6189759969711304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,1,power_law_1.01,0.4512063980102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,1,power_law_1.01,0.46341118812561033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,1,power_law_1.2,0.45372800827026366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,1,power_law_1.2,0.453766393661499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,128,balanced,0.054101333022117615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,128,balanced,0.054431999723116554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,128,power_law_1.01,0.050918400287628174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,128,power_law_1.01,0.05134080052375793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,128,power_law_1.2,0.05160319805145264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,128,power_law_1.2,0.05182719826698303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,16,balanced,0.08032000064849854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,16,balanced,0.080485333998998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,16,power_law_1.01,0.07598080039024353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,16,power_law_1.01,0.07700480222702026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,16,power_law_1.2,0.07701119780540466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,16,power_law_1.2,0.07835519909858704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,2,balanced,0.34009067217508954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,2,balanced,0.3449653387069702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,2,power_law_1.01,0.26074240207672117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,2,power_law_1.01,0.26696319580078126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,2,power_law_1.2,0.2568320035934448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,2,power_law_1.2,0.27077760696411135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,256,balanced,0.050800000627835594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,256,balanced,0.05218133330345154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,256,power_law_1.01,0.04961279928684235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,256,power_law_1.01,0.05006080269813538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,256,power_law_1.2,0.04872319996356964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,256,power_law_1.2,0.04883840084075928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,32,balanced,0.06854400038719177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,32,balanced,0.07152533531188965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,32,power_law_1.01,0.06483839750289917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,32,power_law_1.01,0.06757760047912598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,32,power_law_1.2,0.06570879817008972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,32,power_law_1.2,0.0666815996170044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,4,balanced,0.1948960026105245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,4,balanced,0.1958400011062622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,4,power_law_1.01,0.15139199495315553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,4,power_law_1.01,0.1575744032859802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,4,power_law_1.2,0.16725120544433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,4,power_law_1.2,0.17075200080871583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,64,balanced,0.05667200187842051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,64,balanced,0.05783999959627787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,64,power_law_1.01,0.05591679811477661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,64,power_law_1.01,0.057760000228881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,64,power_law_1.2,0.05467519760131836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,64,power_law_1.2,0.05500800013542175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,8,balanced,0.12812266747156778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,8,balanced,0.1281760036945343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,8,power_law_1.01,0.11399040222167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,8,power_law_1.01,0.12076159715652465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,8,power_law_1.2,0.10318080186843873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,1,8,power_law_1.2,0.11564160585403442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,2,1,balanced,0.3365973234176636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,2,1,balanced,0.33847999572753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,2,1,power_law_1.01,0.25490560531616213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,2,1,power_law_1.01,0.25829119682312013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,2,1,power_law_1.2,0.24952960014343262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,2,1,power_law_1.2,0.25107200145721437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,4,1,balanced,0.2051573395729065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,4,1,balanced,0.20586133003234863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,4,1,power_law_1.01,0.15113600492477416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,4,1,power_law_1.01,0.15449600219726561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,4,1,power_law_1.2,0.15244799852371216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,3072,1536,8,256,4,1,power_law_1.2,0.15397119522094727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,1,balanced,0.3059893250465393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,1,balanced,0.3079520066579183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,1,power_law_1.01,0.2993216037750244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,1,power_law_1.01,0.3060287952423096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,1,power_law_1.2,0.3053247928619385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,1,power_law_1.2,0.31230080127716064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,2,balanced,0.216922660668691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,2,balanced,0.23383466402689615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,2,power_law_1.01,0.22996480464935304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,2,power_law_1.01,0.2310784101486206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,2,power_law_1.2,0.22547199726104736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,2,power_law_1.2,0.2315903902053833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,4,balanced,0.1585599978764852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,4,balanced,0.1590559979279836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,4,power_law_1.01,0.18997759819030763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,4,power_law_1.01,0.19315840005874635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,4,power_law_1.2,0.19498879909515382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,4,power_law_1.2,0.19557119607925416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,8,balanced,0.14754666884740195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,8,balanced,0.149536003669103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,8,power_law_1.01,0.1640447974205017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,8,power_law_1.01,0.17007360458374024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,8,power_law_1.2,0.17034239768981935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,1,8,power_law_1.2,0.17668479681015015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,16,1,balanced,0.053717335065205894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,16,1,balanced,0.05614933371543884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,16,1,power_law_1.01,0.0525439977645874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,16,1,power_law_1.01,0.05303679704666138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,16,1,power_law_1.2,0.05248000025749207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,16,1,power_law_1.2,0.05628799796104431
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,2,1,balanced,0.1685333251953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,2,1,balanced,0.16943466663360596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,2,1,power_law_1.01,0.1683519959449768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,2,1,power_law_1.01,0.17782399654388428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,2,1,power_law_1.2,0.17338240146636963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,2,1,power_law_1.2,0.17562240362167358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,4,1,balanced,0.09922666351000468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,4,1,balanced,0.10124799609184265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,4,1,power_law_1.01,0.10191359519958496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,4,1,power_law_1.01,0.10240000486373901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,4,1,power_law_1.2,0.1019968032836914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,4,1,power_law_1.2,0.10520960092544555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,8,1,balanced,0.0710346649090449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,8,1,balanced,0.07238399982452393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,8,1,power_law_1.01,0.06945279836654664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,8,1,power_law_1.01,0.07066879868507385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,8,1,power_law_1.2,0.06998400092124939
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,14336,2,8,8,1,power_law_1.2,0.06999679803848266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,1,balanced,0.43165866533915204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,1,balanced,0.4319893519083659
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,1,power_law_1.01,0.38172159194946287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,1,power_law_1.01,0.3841471910476685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,1,power_law_1.2,0.38952319622039794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,1,power_law_1.2,0.3958336114883423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,128,balanced,0.05671999851862589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,128,balanced,0.05778133372465769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,128,power_law_1.01,0.053273600339889524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,128,power_law_1.01,0.05451520085334778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,128,power_law_1.2,0.05507199764251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,128,power_law_1.2,0.055289602279663085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,16,balanced,0.07998933394749959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,16,balanced,0.080485333998998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,16,power_law_1.01,0.07509120106697083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,16,power_law_1.01,0.08076800107955932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,16,power_law_1.2,0.07809280157089234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,16,power_law_1.2,0.07936639785766601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,2,balanced,0.24374399582544962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,2,balanced,0.2462666630744934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,2,power_law_1.01,0.2265536069869995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,2,power_law_1.01,0.2266752004623413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,2,power_law_1.2,0.22884480953216552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,2,power_law_1.2,0.23132801055908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,32,balanced,0.06656000018119812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,32,balanced,0.07001600166161855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,32,power_law_1.01,0.06181120276451111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,32,power_law_1.01,0.06475520133972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,32,power_law_1.2,0.06258559823036194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,32,power_law_1.2,0.06444799900054932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,4,balanced,0.15475199619928995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,4,balanced,0.15826666355133057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,4,power_law_1.01,0.14577920436859132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,4,power_law_1.01,0.1502784013748169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,4,power_law_1.2,0.14264320135116576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,4,power_law_1.2,0.1450816035270691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,64,balanced,0.058890665570894875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,64,balanced,0.05913066864013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,64,power_law_1.01,0.056518399715423585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,64,power_law_1.01,0.05767040252685547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,64,power_law_1.2,0.05631359815597534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,64,power_law_1.2,0.05868800282478333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,8,balanced,0.09256533781687419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,8,balanced,0.09274666508038838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,8,power_law_1.01,0.08967679738998413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,8,power_law_1.01,0.08969600200653076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,8,power_law_1.2,0.08972160220146179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,1,8,power_law_1.2,0.09052799940109253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,2,1,balanced,0.23898667097091675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,2,1,balanced,0.23937066396077475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,2,1,power_law_1.01,0.21868159770965576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,2,1,power_law_1.01,0.22439041137695312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,2,1,power_law_1.2,0.2247744083404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,2,1,power_law_1.2,0.22669439315795897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,4,1,balanced,0.15939733386039734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,4,1,balanced,0.15991999705632529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,4,1,power_law_1.01,0.14704639911651612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,4,1,power_law_1.01,0.15264639854431153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,4,1,power_law_1.2,0.14908159971237184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,1536,8,128,4,1,power_law_1.2,0.15041919946670532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,1,balanced,2.7147998809814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,1,balanced,2.7163146336873374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,1,power_law_1.01,2.1449344635009764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,1,power_law_1.01,2.1728384017944338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,1,power_law_1.2,2.1378496170043944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,1,power_law_1.2,2.1906944274902345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,128,balanced,0.09649599591890971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,128,balanced,0.1002400020758311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,128,power_law_1.01,0.09626240134239197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,128,power_law_1.01,0.0969983994960785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,128,power_law_1.2,0.09279999732971192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,128,power_law_1.2,0.09580159783363343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,16,balanced,0.24642133712768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,16,balanced,0.24688533941904703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,16,power_law_1.01,0.2197567939758301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,16,power_law_1.01,0.23664000034332275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,16,power_law_1.2,0.21696000099182128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,16,power_law_1.2,0.2203455924987793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,2,balanced,1.3923892974853516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,2,balanced,1.3940320014953613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,2,power_law_1.01,1.1470975875854492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,2,power_law_1.01,1.1874176025390626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,2,power_law_1.2,1.1369407653808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,2,power_law_1.2,1.1892992019653321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,256,balanced,0.0867786705493927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,256,balanced,0.09054932991663615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,256,power_law_1.01,0.08662400245666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,256,power_law_1.01,0.08842880129814149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,256,power_law_1.2,0.08666239976882935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,256,power_law_1.2,0.08982399702072144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,32,balanced,0.16290133198102316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,32,balanced,0.16386133432388306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,32,power_law_1.01,0.1475200057029724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,32,power_law_1.01,0.15148799419403075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,32,power_law_1.2,0.15358079671859742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,32,power_law_1.2,0.15542399883270264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,4,balanced,0.738368034362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,4,balanced,0.7392586867014567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,4,power_law_1.01,0.5989888191223145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,4,power_law_1.01,0.6108992099761963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,4,power_law_1.2,0.5867584228515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,4,power_law_1.2,0.6069952011108398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,64,balanced,0.11176533500353496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,64,balanced,0.11199999849001567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,64,power_law_1.01,0.10734080076217652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,64,power_law_1.01,0.10873600244522094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,64,power_law_1.2,0.10428800582885742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,64,power_law_1.2,0.10707839727401733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,8,balanced,0.40508798758188885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,8,balanced,0.40760000546773273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,8,power_law_1.01,0.3607104063034058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,8,power_law_1.01,0.3803839921951294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,8,power_law_1.2,0.33352959156036377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,4096,2688,22,512,1,8,power_law_1.2,0.3559423923492432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,1,balanced,0.4630613327026367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,1,balanced,0.4639093478520711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,1,power_law_1.01,0.4755904197692871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,1,power_law_1.01,0.4775424003601074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,1,power_law_1.2,0.47361278533935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,1,power_law_1.2,0.4770815849304199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,2,balanced,0.3115520079930623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,2,balanced,0.3548640012741089
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,2,power_law_1.01,0.3336704015731812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,2,power_law_1.01,0.3373503923416138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,2,power_law_1.2,0.33489279747009276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,2,power_law_1.2,0.33972480297088625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,4,balanced,0.20874667167663574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,4,balanced,0.2102186679840088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,4,power_law_1.01,0.2568831920623779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,4,power_law_1.01,0.266758394241333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,4,power_law_1.2,0.2535936117172241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,4,power_law_1.2,0.25873920917510984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,8,balanced,0.18133866786956787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,8,balanced,0.18518400192260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,8,power_law_1.01,0.1923967957496643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,8,power_law_1.01,0.2131200075149536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,8,power_law_1.2,0.20714240074157714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,1,8,power_law_1.2,0.23145599365234376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,16,1,balanced,0.07381333410739899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,16,1,balanced,0.07449066638946533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,16,1,power_law_1.01,0.07283200025558471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,16,1,power_law_1.01,0.07296000123023987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,16,1,power_law_1.2,0.0723136007785797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,16,1,power_law_1.2,0.07283200025558471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,2,1,balanced,0.24665600061416626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,2,1,balanced,0.24887466430664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,2,1,power_law_1.01,0.26654078960418703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,2,1,power_law_1.01,0.26858880519866946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,2,1,power_law_1.2,0.26537599563598635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,2,1,power_law_1.2,0.2712831974029541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,32,1,balanced,0.05990933378537496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,32,1,balanced,0.06214400132497152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,32,1,power_law_1.01,0.05761920213699341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,32,1,power_law_1.01,0.05861759781837463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,32,1,power_law_1.2,0.057811200618743896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,32,1,power_law_1.2,0.05865600109100342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,4,1,balanced,0.1399786671002706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,4,1,balanced,0.15059733390808105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,4,1,power_law_1.01,0.157043194770813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,4,1,power_law_1.01,0.16325759887695312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,4,1,power_law_1.2,0.15291520357131957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,4,1,power_law_1.2,0.15994880199432374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,8,1,balanced,0.09493333101272583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,8,1,balanced,0.099781334400177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,8,1,power_law_1.01,0.0924351990222931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,8,1,power_law_1.01,0.09376639723777772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,8,1,power_law_1.2,0.09236479997634887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,16384,2,8,8,1,power_law_1.2,0.09260159730911255
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,1,balanced,1.5632960001627605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,1,balanced,1.5690773328145344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,1,power_law_1.01,1.1460864067077636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,1,power_law_1.01,1.1544511795043946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,1,power_law_1.2,1.1110591888427734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,1,power_law_1.2,1.1339136123657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,128,balanced,0.07972800234953563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,128,balanced,0.08248533308506012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,128,power_law_1.01,0.07942399978637696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,128,power_law_1.01,0.08256639838218689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,128,power_law_1.2,0.0766592025756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,128,power_law_1.2,0.08155519962310791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,16,balanced,0.14940266807874045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,16,balanced,0.15172800421714783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,16,power_law_1.01,0.13430399894714357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,16,power_law_1.01,0.14551680088043212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,16,power_law_1.2,0.13289599418640136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,16,power_law_1.2,0.14450559616088868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,2,balanced,0.8132373491923014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,2,balanced,0.8136746883392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,2,power_law_1.01,0.6276671886444092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,2,power_law_1.01,0.6488448143005371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,2,power_law_1.2,0.5920447826385498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,2,power_law_1.2,0.6420608043670655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,256,balanced,0.07116266588370006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,256,balanced,0.07241599758466084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,256,power_law_1.01,0.07085440158843995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,256,power_law_1.01,0.07090560197830201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,256,power_law_1.2,0.07015680074691773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,256,power_law_1.2,0.07215999960899352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,32,balanced,0.10828800002733867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,32,balanced,0.10979732871055603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,32,power_law_1.01,0.10090880393981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,32,power_law_1.01,0.10176639556884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,32,power_law_1.2,0.10188800096511841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,32,power_law_1.2,0.10476160049438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,4,balanced,0.44571733474731445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,4,balanced,0.4464000066121419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,4,power_law_1.01,0.38300158977508547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,4,power_law_1.01,0.4113152027130127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,4,power_law_1.2,0.38056321144104005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,4,power_law_1.2,0.3857919931411743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,64,balanced,0.0940106709798177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,64,balanced,0.09708799918492635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,64,power_law_1.01,0.09264000058174134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,64,power_law_1.01,0.09322879910469055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,64,power_law_1.2,0.09106559753417968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,64,power_law_1.2,0.09296640157699584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,8,balanced,0.24485333760579428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,8,balanced,0.2460106611251831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,8,power_law_1.01,0.23418879508972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,8,power_law_1.01,0.23617920875549317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,8,power_law_1.2,0.22028160095214844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,1,8,power_law_1.2,0.2388672113418579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,16,1,balanced,0.1812266707420349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,16,1,balanced,0.18204265832901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,16,1,power_law_1.01,0.14142080545425414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,16,1,power_law_1.01,0.14320000410079955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,16,1,power_law_1.2,0.14134399890899657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,16,1,power_law_1.2,0.14184319972991943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,2,1,balanced,0.8053920269012451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,2,1,balanced,0.8057440121968588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,2,1,power_law_1.01,0.5882880210876464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,2,1,power_law_1.01,0.5922815799713135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,2,1,power_law_1.2,0.575820779800415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,2,1,power_law_1.2,0.587334394454956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,4,1,balanced,0.45451200008392334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,4,1,balanced,0.45465068022410077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,4,1,power_law_1.01,0.3445312023162842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,4,1,power_law_1.01,0.34622719287872317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,4,1,power_law_1.2,0.3337984085083008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,4,1,power_law_1.2,0.3394815921783447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,8,1,balanced,0.3075466752052307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,8,1,balanced,0.31275200843811035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,8,1,power_law_1.01,0.2116863965988159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,8,1,power_law_1.01,0.21187200546264648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,8,1,power_law_1.2,0.20439679622650148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2048,8,256,8,1,power_law_1.2,0.20841600894927978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,1,balanced,1.239840030670166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,1,balanced,1.2465173403422039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,1,power_law_1.01,1.0324224472045898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,1,power_law_1.01,1.0481151580810546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,1,power_law_1.2,1.0291839599609376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,1,power_law_1.2,1.0372223854064941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,16,balanced,0.12590932846069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,16,balanced,0.12595733006795248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,16,power_law_1.01,0.11763839721679688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,16,power_law_1.01,0.1196671962738037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,16,power_law_1.2,0.1201856017112732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,16,power_law_1.2,0.1220736026763916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,2,balanced,0.6618933280309042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,2,balanced,0.663045326868693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,2,power_law_1.01,0.5311744213104248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,2,power_law_1.01,0.575648021697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,2,power_law_1.2,0.566374397277832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,2,power_law_1.2,0.5674880027770997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,32,balanced,0.10733866691589355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,32,balanced,0.10971200466156006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,32,power_law_1.01,0.10645760297775268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,32,power_law_1.01,0.10772479772567749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,32,power_law_1.2,0.10584959983825684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,32,power_law_1.2,0.10629119873046874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,4,balanced,0.3574506839116414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,4,balanced,0.35849066575368244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,4,power_law_1.01,0.3204416036605835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,4,power_law_1.01,0.33183999061584474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,4,power_law_1.2,0.30589439868927004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,4,power_law_1.2,0.3232703924179077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,8,balanced,0.23933333158493042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,8,balanced,0.24021865924199423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,8,power_law_1.01,0.2151103973388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,8,power_law_1.01,0.2212735891342163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,8,power_law_1.2,0.2133631944656372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,1,8,power_law_1.2,0.21368319988250734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,2,1,balanced,0.6555573145548502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,2,1,balanced,0.6565599838892618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,2,1,power_law_1.01,0.5488639831542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,2,1,power_law_1.01,0.5500288009643555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,2,1,power_law_1.2,0.5544320106506347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,2,1,power_law_1.2,0.5557568073272705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,4,1,balanced,0.35891199111938477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,4,1,balanced,0.36101333300272626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,4,1,power_law_1.01,0.31877760887145995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,4,1,power_law_1.01,0.3206592082977295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,4,1,power_law_1.2,0.31880960464477537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,6144,2560,8,160,4,1,power_law_1.2,0.31994879245758057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,1,balanced,1.8265493710835774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,1,balanced,1.8380427360534668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,1,power_law_1.01,1.3164287567138673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,1,power_law_1.01,1.3409215927124023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,1,power_law_1.2,1.300870418548584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,1,power_law_1.2,1.3189888000488281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,128,balanced,0.0906933347384135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,128,balanced,0.09154133001963298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,128,power_law_1.01,0.09079679846763611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,128,power_law_1.01,0.09223679900169372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,128,power_law_1.2,0.08809599876403809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,128,power_law_1.2,0.08947839736938476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,16,balanced,0.16521599888801575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,16,balanced,0.16528000434239706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,16,power_law_1.01,0.15088640451431273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,16,power_law_1.01,0.1544000029563904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,16,power_law_1.2,0.1601215958595276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,16,power_law_1.2,0.1602560043334961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,2,balanced,0.9471039772033691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,2,balanced,0.9499413172403971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,2,power_law_1.01,0.7112319946289063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,2,power_law_1.01,0.7208000183105469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,2,power_law_1.2,0.7480959892272949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,2,power_law_1.2,0.7509183883666992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,256,balanced,0.07874666651089986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,256,balanced,0.08065066734949748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,256,power_law_1.01,0.07592960000038147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,256,power_law_1.01,0.07704960107803345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,256,power_law_1.2,0.07497599720954895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,256,power_law_1.2,0.0760703980922699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,32,balanced,0.12211733063062032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,32,balanced,0.1236853301525116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,32,power_law_1.01,0.11271040439605713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,32,power_law_1.01,0.1208191990852356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,32,power_law_1.2,0.11471999883651733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,32,power_law_1.2,0.11658240556716919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,4,balanced,0.5119253396987915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,4,balanced,0.5136053164800009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,4,power_law_1.01,0.4332736015319824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,4,power_law_1.01,0.4500415802001953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,4,power_law_1.2,0.45488638877868653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,4,power_law_1.2,0.4635647773742676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,64,balanced,0.10387733578681946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,64,balanced,0.10466133554776509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,64,power_law_1.01,0.10080000162124633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,64,power_law_1.01,0.10188159942626954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,64,power_law_1.2,0.09937279820442199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,64,power_law_1.2,0.101254403591156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,8,balanced,0.28280532360076904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,8,balanced,0.28536534309387207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,8,power_law_1.01,0.25144960880279543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,8,power_law_1.01,0.26124160289764403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,8,power_law_1.2,0.24375040531158448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,1,8,power_law_1.2,0.26309120655059814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,16,1,balanced,0.2052853306134542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,16,1,balanced,0.20704533656438193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,16,1,power_law_1.01,0.1619328022003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,16,1,power_law_1.01,0.16361600160598755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,16,1,power_law_1.2,0.1561792016029358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,16,1,power_law_1.2,0.1588863968849182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,2,1,balanced,0.9501226743062338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,2,1,balanced,0.9520426591237386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,2,1,power_law_1.01,0.6878911972045898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,2,1,power_law_1.01,0.6907519817352294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,2,1,power_law_1.2,0.680179214477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,2,1,power_law_1.2,0.6822912216186523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,4,1,balanced,0.5452693303426107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,4,1,balanced,0.545578678448995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,4,1,power_law_1.01,0.401632022857666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,4,1,power_law_1.01,0.4022208213806152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,4,1,power_law_1.2,0.3990400075912476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,4,1,power_law_1.2,0.399072003364563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,8,1,balanced,0.34109334150950116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,8,1,balanced,0.35202133655548096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,8,1,power_law_1.01,0.24275200366973876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,8,1,power_law_1.01,0.24325120449066162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,8,1,power_law_1.2,0.2360703945159912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,256,8,1,power_law_1.2,0.23892478942871093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,1,balanced,2.712042808532715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,1,balanced,2.7160959243774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,1,power_law_1.01,1.3886655807495116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,1,power_law_1.01,1.3985919952392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,1,power_law_1.2,1.2591872215270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,1,power_law_1.2,1.293331241607666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,128,balanced,0.10029866298039754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,128,balanced,0.10148266951243083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,128,power_law_1.01,0.0973695993423462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,128,power_law_1.01,0.0998080015182495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,128,power_law_1.2,0.09488639831542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,128,power_law_1.2,0.09619839787483216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,16,balanced,0.2481706738471985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,16,balanced,0.2550506591796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,16,power_law_1.01,0.21232640743255615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,16,power_law_1.01,0.21429119110107422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,16,power_law_1.2,0.19534080028533934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,16,power_law_1.2,0.22747519016265869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,2,balanced,1.3865866661071777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,2,balanced,1.3877174059549968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,2,power_law_1.01,0.7630591869354248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,2,power_law_1.01,0.8066176414489746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,2,power_law_1.2,0.7575104236602783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,2,power_law_1.2,0.7747327804565429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,32,balanced,0.14662399888038635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,32,balanced,0.14844266573588052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,32,power_law_1.01,0.1356160044670105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,32,power_law_1.01,0.13649280071258546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,32,power_law_1.2,0.12748160362243652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,32,power_law_1.2,0.1348863959312439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,4,balanced,0.7363786697387695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,4,balanced,0.736687978108724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,4,power_law_1.01,0.478931188583374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,4,power_law_1.01,0.5043903827667237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,4,power_law_1.2,0.45626239776611327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,4,power_law_1.2,0.5442240238189697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,64,balanced,0.1141813298066457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,64,balanced,0.1172160009543101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,64,power_law_1.01,0.10561920404434204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,64,power_law_1.01,0.10996479988098144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,64,power_law_1.2,0.10340479612350464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,64,power_law_1.2,0.10849920511245728
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,8,balanced,0.39833064874013263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,8,balanced,0.40053868293762207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,8,power_law_1.01,0.33956480026245117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,8,power_law_1.01,0.35174400806427003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,8,power_law_1.2,0.38455040454864503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,1,8,power_law_1.2,0.3997056007385254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,16,1,balanced,0.3099199930826823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,16,1,balanced,0.31799999872843426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,16,1,power_law_1.01,0.17449599504470825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,16,1,power_law_1.01,0.1756991982460022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,16,1,power_law_1.2,0.16255999803543092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,16,1,power_law_1.2,0.1633344054222107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,2,1,balanced,1.3940906524658203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,2,1,balanced,1.3954025904337566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,2,1,power_law_1.01,0.7330751895904541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,2,1,power_law_1.01,0.7515135765075683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,2,1,power_law_1.2,0.6779263973236084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,2,1,power_law_1.2,0.6881663799285889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,4,1,balanced,0.7865119775136312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,4,1,balanced,0.7869013150533041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,4,1,power_law_1.01,0.41648001670837403
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,4,1,power_law_1.01,0.4255360126495361
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,4,1,power_law_1.2,0.39574398994445803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,4,1,power_law_1.2,0.39967999458312986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,8,1,balanced,0.4485386610031128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,8,1,balanced,0.45099735260009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,8,1,power_law_1.01,0.27066240310668943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,8,1,power_law_1.01,0.2761087894439697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,8,1,power_law_1.2,0.2637376070022583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,48,7168,2048,8,384,8,1,power_law_1.2,0.26545279026031493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,1,balanced,0.25273066759109497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,1,balanced,0.2530720035235087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,1,power_law_1.01,0.27859199047088623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,1,power_law_1.01,0.2789184093475342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,1,power_law_1.2,0.28190720081329346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,1,power_law_1.2,0.2820096015930176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,128,balanced,0.07530133426189423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,128,balanced,0.07544533411661784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,128,power_law_1.01,0.07585279941558838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,128,power_law_1.01,0.07858560085296631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,128,power_law_1.2,0.07913600206375122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,128,power_law_1.2,0.07916799783706666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,16,balanced,0.08853333195050557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,16,balanced,0.08901333808898926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,16,power_law_1.01,0.08984320163726807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,16,power_law_1.01,0.09086719751358033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,16,power_law_1.2,0.09150720238685608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,16,power_law_1.2,0.09258880019187928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,2,balanced,0.16873067617416382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,2,balanced,0.1691733400026957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,2,power_law_1.01,0.18958719968795776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,2,power_law_1.01,0.1898368000984192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,2,power_law_1.2,0.19363199472427367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,2,power_law_1.2,0.1942528009414673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,32,balanced,0.07961066563924153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,32,balanced,0.08044800162315369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,32,power_law_1.01,0.08043519854545593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,32,power_law_1.01,0.08258559703826904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,32,power_law_1.2,0.08380159735679626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,32,power_law_1.2,0.08565760254859925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,4,balanced,0.1273973286151886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,4,balanced,0.12826133767763773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,4,power_law_1.01,0.13219840526580812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,4,power_law_1.01,0.13338880538940429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,4,power_law_1.2,0.13448959589004517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,4,power_law_1.2,0.13511680364608764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,64,balanced,0.07665066421031952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,64,balanced,0.07774400214354198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,64,power_law_1.01,0.07946239709854126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,64,power_law_1.01,0.07951359748840332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,64,power_law_1.2,0.07962239980697632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,64,power_law_1.2,0.07994239926338195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,8,balanced,0.09707732995351155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,8,balanced,0.09739200274149577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,8,power_law_1.01,0.10638079643249512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,8,power_law_1.01,0.10936319828033447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,8,power_law_1.2,0.11178239583969116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,1,8,power_law_1.2,0.11185920238494873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,2,1,balanced,0.15692800283432007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,2,1,balanced,0.15769599874814352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,2,1,power_law_1.01,0.17766400575637817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,2,1,power_law_1.01,0.17864320278167725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,2,1,power_law_1.2,0.17917439937591553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,2048,768,8,128,2,1,power_law_1.2,0.18263039588928223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,1,balanced,1.0919146537780762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,1,balanced,1.0930720170338948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,1,power_law_1.01,1.030675220489502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,1,power_law_1.01,1.0367615699768067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,1,power_law_1.2,1.0839360237121582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,1,power_law_1.2,1.106982421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,128,balanced,0.14798933267593384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,128,balanced,0.14818666378657022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,128,power_law_1.01,0.14824960231781006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,128,power_law_1.01,0.14975359439849853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,128,power_law_1.2,0.1518720030784607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,128,power_law_1.2,0.1525056004524231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,16,balanced,0.20354666312535605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,16,balanced,0.20356800158818564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,16,power_law_1.01,0.20499839782714843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,16,power_law_1.01,0.20879359245300294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,16,power_law_1.2,0.20618879795074463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,16,power_law_1.2,0.21152639389038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,2,balanced,0.6276373465855917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,2,balanced,0.6291199922561646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,2,power_law_1.01,0.60033278465271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,2,power_law_1.01,0.6063488006591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,2,power_law_1.2,0.6234176158905029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,2,power_law_1.2,0.6353151798248291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,256,balanced,0.14148267110188803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,256,balanced,0.14389333128929138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,256,power_law_1.01,0.14536960124969484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,256,power_law_1.01,0.14570879936218262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,256,power_law_1.2,0.14708479642868041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,256,power_law_1.2,0.14956799745559693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,32,balanced,0.17123732964197794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,32,balanced,0.17222400506337485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,32,power_law_1.01,0.1729856014251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,32,power_law_1.01,0.17858560085296632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,32,power_law_1.2,0.1790336012840271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,32,power_law_1.2,0.18090239763259888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,4,balanced,0.39345065752665204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,4,balanced,0.39372265338897705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,4,power_law_1.01,0.38404479026794436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,4,power_law_1.01,0.39486079216003417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,4,power_law_1.2,0.3931583881378174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,4,power_law_1.2,0.3957567930221558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,64,balanced,0.15519466996192932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,64,balanced,0.1563146710395813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,64,power_law_1.01,0.15694719552993774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,64,power_law_1.01,0.15724159479141236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,64,power_law_1.2,0.15837440490722657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,64,power_law_1.2,0.16454399824142457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,8,balanced,0.26869332790374756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,8,balanced,0.2691253423690796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,8,power_law_1.01,0.2698303937911987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,8,power_law_1.01,0.27005441188812257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,8,power_law_1.2,0.27929599285125734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,1,8,power_law_1.2,0.28170878887176515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,2,1,balanced,0.614682674407959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,2,1,balanced,0.6156320174535116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,2,1,power_law_1.01,0.5741824150085449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,2,1,power_law_1.01,0.5899839878082276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,2,1,power_law_1.2,0.6012159824371338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,2,1,power_law_1.2,0.6032832145690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,4,1,balanced,0.3747466802597046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,4,1,balanced,0.37597866853078205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,4,1,power_law_1.01,0.3513407945632935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,4,1,power_law_1.01,0.3555327892303467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,4,1,power_law_1.2,0.358022403717041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,3072,1536,8,256,4,1,power_law_1.2,0.36729600429534914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,1,balanced,0.841925303141276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,1,balanced,0.8431893189748129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,1,power_law_1.01,1.0413567543029785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,1,power_law_1.01,1.0539456367492677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,1,power_law_1.2,1.0442048072814942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,1,power_law_1.2,1.0589887619018554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,2,balanced,0.5039199988047282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,2,balanced,0.5051519870758057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,2,power_law_1.01,0.7364352226257325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,2,power_law_1.01,0.7391295909881592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,2,power_law_1.2,0.7310848236083984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,2,power_law_1.2,0.7338943958282471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,4,balanced,0.38708265622456867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,4,balanced,0.3874613444010417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,4,power_law_1.01,0.5889088153839112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,4,power_law_1.01,0.6204415798187256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,4,power_law_1.2,0.5468736171722413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,4,power_law_1.2,0.5827072143554688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,8,balanced,0.3272586663564046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,8,balanced,0.3276960055033366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,8,power_law_1.01,0.45937280654907225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,8,power_law_1.01,0.4665855884552002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,8,power_law_1.2,0.4548992156982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,1,8,power_law_1.2,0.4654528141021729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,16,1,balanced,0.09574400385220845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,16,1,balanced,0.0972160001595815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,16,1,power_law_1.01,0.10403200387954711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,16,1,power_law_1.01,0.10487680435180664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,16,1,power_law_1.2,0.10410239696502685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,16,1,power_law_1.2,0.11003520488739013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,2,1,balanced,0.4538079897562663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,2,1,balanced,0.4540319840113322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,2,1,power_law_1.01,0.5409535884857177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,2,1,power_law_1.01,0.5410624027252198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,2,1,power_law_1.2,0.5430784225463867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,2,1,power_law_1.2,0.5479551792144776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,4,1,balanced,0.2627573410669963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,4,1,balanced,0.26338134209314984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,4,1,power_law_1.01,0.29933440685272217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,4,1,power_law_1.01,0.304640007019043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,4,1,power_law_1.2,0.2931135892868042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,4,1,power_law_1.2,0.2936255931854248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,8,1,balanced,0.15230400363604227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,8,1,balanced,0.1536960005760193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,8,1,power_law_1.01,0.1738368034362793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,8,1,power_law_1.01,0.17893120050430297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,8,1,power_law_1.2,0.16701439619064332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,14336,2,8,8,1,power_law_1.2,0.17280639410018922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,1,balanced,0.7636853059132894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,1,balanced,0.7646293640136719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,1,power_law_1.01,0.8688703536987304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,1,power_law_1.01,0.8783488273620605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,1,power_law_1.2,0.8976192474365234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,1,power_law_1.2,0.9033408164978027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,128,balanced,0.14313066999117532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,128,balanced,0.14330666263898215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,128,power_law_1.01,0.14421119689941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,128,power_law_1.01,0.14484479427337646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,128,power_law_1.2,0.14733439683914185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,128,power_law_1.2,0.14945919513702394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,16,balanced,0.16389866669972739
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,16,balanced,0.16454933087031046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,16,power_law_1.01,0.19366400241851806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,16,power_law_1.01,0.19440000057220458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,16,power_law_1.2,0.19818240404129028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,16,power_law_1.2,0.20448639392852783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,2,balanced,0.46701331933339435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,2,balanced,0.4676213264465332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,2,power_law_1.01,0.5180736064910889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,2,power_law_1.01,0.5269248008728027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,2,power_law_1.2,0.5425151824951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,2,power_law_1.2,0.5483327865600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,32,balanced,0.1527359982331594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,32,balanced,0.15312533577283224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,32,power_law_1.01,0.15808000564575195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,32,power_law_1.01,0.1597632050514221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,32,power_law_1.2,0.16396160125732423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,32,power_law_1.2,0.16870399713516235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,4,balanced,0.2922293345133464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,4,balanced,0.29229867458343506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,4,power_law_1.01,0.3322367906570435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,4,power_law_1.01,0.34022400379180906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,4,power_law_1.2,0.34189438819885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,4,power_law_1.2,0.3469311952590942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,64,balanced,0.14410133163134256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,64,balanced,0.14659200112024942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,64,power_law_1.01,0.14810240268707275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,64,power_law_1.01,0.1490623950958252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,64,power_law_1.2,0.15077760219573974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,64,power_law_1.2,0.15312000513076782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,8,balanced,0.2164426644643148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,8,balanced,0.21793067455291748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,8,power_law_1.01,0.24431359767913818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,8,power_law_1.01,0.24451839923858643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,8,power_law_1.2,0.2529920101165771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,1,8,power_law_1.2,0.25575039386749265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,2,1,balanced,0.44635732968648273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,2,1,balanced,0.447157343228658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,2,1,power_law_1.01,0.49022722244262695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,2,1,power_law_1.01,0.4917312145233154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,2,1,power_law_1.2,0.4959424018859863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,2,1,power_law_1.2,0.496230411529541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,4,1,balanced,0.2712693413098653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,4,1,balanced,0.272544006506602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,4,1,power_law_1.01,0.3126271963119507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,4,1,power_law_1.01,0.31491200923919677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,4,1,power_law_1.2,0.3162048101425171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,1536,8,128,4,1,power_law_1.2,0.31775360107421874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,1,balanced,4.763855934143066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,1,balanced,4.768581390380859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,1,power_law_1.01,4.906118392944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,1,power_law_1.01,4.94189453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,1,power_law_1.2,5.106502532958984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,1,power_law_1.2,5.15296630859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,128,balanced,0.4941279888153076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,128,balanced,0.49450135231018066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,128,power_law_1.01,0.5152063846588135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,128,power_law_1.01,0.5173056125640869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,128,power_law_1.2,0.5253312110900878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,128,power_law_1.2,0.5276031970977784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,16,balanced,0.7399733066558838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,16,balanced,0.7416586875915527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,16,power_law_1.01,0.7801599979400635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,16,power_law_1.01,0.7803775787353515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,16,power_law_1.2,0.8054271697998047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,16,power_law_1.2,0.8077312469482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,2,balanced,2.637946605682373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,2,balanced,2.639824072519938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,2,power_law_1.01,2.7250751495361327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,2,power_law_1.01,2.7623807907104494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,2,power_law_1.2,2.7987648010253907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,2,power_law_1.2,2.8582271575927733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,256,balanced,0.4751360019048055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,256,balanced,0.4774880011876424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,256,power_law_1.01,0.491315221786499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,256,power_law_1.01,0.4922304153442383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,256,power_law_1.2,0.5006912231445313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,256,power_law_1.2,0.5028480052947998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,32,balanced,0.6005653142929077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,32,balanced,0.6007146835327148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,32,power_law_1.01,0.6296832084655761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,32,power_law_1.01,0.6297728061676026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,32,power_law_1.2,0.6426496028900146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,32,power_law_1.2,0.645414400100708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,4,balanced,1.558245340983073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,4,balanced,1.5610987345377605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,4,power_law_1.01,1.618227195739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,4,power_law_1.01,1.624684715270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,4,power_law_1.2,1.6345024108886719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,4,power_law_1.2,1.6678464889526368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,64,balanced,0.5310986836751302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,64,balanced,0.5342293183008829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,64,power_law_1.01,0.5466752052307129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,64,power_law_1.01,0.5533760070800782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,64,power_law_1.2,0.5610752105712891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,64,power_law_1.2,0.5643136024475097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,8,balanced,1.0185919602711995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,8,balanced,1.0196906725565593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,8,power_law_1.01,1.0636159896850585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,8,power_law_1.01,1.0687744140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,8,power_law_1.2,1.1037631988525392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,4096,2688,22,512,1,8,power_law_1.2,1.1101247787475585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,1,balanced,1.3242932955423992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,1,balanced,1.325173298517863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,1,power_law_1.01,1.6352575302124024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,1,power_law_1.01,1.659993553161621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,1,power_law_1.2,1.600998306274414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,1,power_law_1.2,1.6464448928833009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,2,balanced,0.8174880345662435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,2,balanced,0.8183200359344482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,2,power_law_1.01,1.119212818145752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,2,power_law_1.01,1.1317503929138184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,2,power_law_1.2,1.0781696319580079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,2,power_law_1.2,1.2067839622497558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,4,balanced,0.5072319904963175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,4,balanced,0.5082826614379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,4,power_law_1.01,0.7695551872253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,4,power_law_1.01,0.8298368453979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,4,power_law_1.2,0.9353471755981445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,4,power_law_1.2,0.9528384208679199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,8,balanced,0.406549334526062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,8,balanced,0.40677332878112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,8,power_law_1.01,0.7155776023864746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,8,power_law_1.01,0.7653823852539062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,8,power_law_1.2,0.7565311908721923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,1,8,power_law_1.2,0.7600192070007324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,16,1,balanced,0.13395200173060098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,16,1,balanced,0.13524799545605978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,16,1,power_law_1.01,0.18748799562454224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,16,1,power_law_1.01,0.1899072051048279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,16,1,power_law_1.2,0.1893952012062073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,16,1,power_law_1.2,0.18951679468154908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,2,1,balanced,0.684063990910848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,2,1,balanced,0.6852746804555258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,2,1,power_law_1.01,0.857260799407959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,2,1,power_law_1.01,0.857868766784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,2,1,power_law_1.2,0.8582528114318848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,2,1,power_law_1.2,0.8742015838623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,32,1,balanced,0.11473066608111064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,32,1,balanced,0.1159946620464325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,32,1,power_law_1.01,0.11921919584274292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,32,1,power_law_1.01,0.12055039405822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,32,1,power_law_1.2,0.11996159553527833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,32,1,power_law_1.2,0.12004480361938477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,4,1,balanced,0.3895466725031535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,4,1,balanced,0.39033599694569904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,4,1,power_law_1.01,0.4637887954711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,4,1,power_law_1.01,0.4658944129943848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,4,1,power_law_1.2,0.46343679428100587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,4,1,power_law_1.2,0.46387200355529784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,8,1,balanced,0.21994666258494058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,8,1,balanced,0.22012799978256226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,8,1,power_law_1.01,0.2792191982269287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,8,1,power_law_1.01,0.27985920906066897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,8,1,power_law_1.2,0.2799936056137085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,16384,2,8,8,1,power_law_1.2,0.28115200996398926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,1,balanced,2.661658604939779
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,1,balanced,2.662207921346029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,1,power_law_1.01,2.5196672439575196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,1,power_law_1.01,2.5523775100708006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,1,power_law_1.2,2.6639551162719726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,1,power_law_1.2,2.694713592529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,128,balanced,0.23389333486557007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,128,balanced,0.2339573303858439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,128,power_law_1.01,0.2392319917678833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,128,power_law_1.01,0.24161279201507568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,128,power_law_1.2,0.2467519998550415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,128,power_law_1.2,0.24757759571075438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,16,balanced,0.3741919994354248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,16,balanced,0.37673600514729816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,16,power_law_1.01,0.3828288078308105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,16,power_law_1.01,0.39130239486694335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,16,power_law_1.2,0.3939519882202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,16,power_law_1.2,0.4004032135009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,2,balanced,1.4506079355875652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,2,balanced,1.451584021250407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,2,power_law_1.01,1.384934425354004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,2,power_law_1.01,1.399238395690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,2,power_law_1.2,1.4248640060424804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,2,power_law_1.2,1.452608013153076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,256,balanced,0.22605333725611368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,256,balanced,0.22629332542419434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,256,power_law_1.01,0.2296447992324829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,256,power_law_1.01,0.23066239356994628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,256,power_law_1.2,0.23519361019134521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,256,power_law_1.2,0.23644800186157228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,32,balanced,0.2967413266499837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,32,balanced,0.29767467578252155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,32,power_law_1.01,0.3027776002883911
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,32,power_law_1.01,0.30883839130401614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,32,power_law_1.2,0.3131455898284912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,32,power_law_1.2,0.31948161125183105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,4,balanced,0.8435093561808268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,4,balanced,0.8439306418100992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,4,power_law_1.01,0.8217087745666504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,4,power_law_1.01,0.8363712310791016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,4,power_law_1.2,0.8422400474548339
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,4,power_law_1.2,0.8684415817260742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,64,balanced,0.25276799996693927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,64,balanced,0.2529653310775757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,64,power_law_1.01,0.26382720470428467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,64,power_law_1.01,0.2649983882904053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,64,power_law_1.2,0.27130880355834963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,64,power_law_1.2,0.2764863967895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,8,balanced,0.5290559927622477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,8,balanced,0.5299626588821411
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,8,power_law_1.01,0.5253119945526123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,8,power_law_1.01,0.5432767868041992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,8,power_law_1.2,0.5357247829437256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,1,8,power_law_1.2,0.5468607902526855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,16,1,balanced,0.37970133622487384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,16,1,balanced,0.3812853495279948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,16,1,power_law_1.01,0.37183361053466796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,16,1,power_law_1.01,0.37256319522857667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,16,1,power_law_1.2,0.374617600440979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,16,1,power_law_1.2,0.3838848114013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,2,1,balanced,1.4268800417582195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,2,1,balanced,1.4271413485209148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,2,1,power_law_1.01,1.3836223602294921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,2,1,power_law_1.01,1.383743953704834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,2,1,power_law_1.2,1.4385600090026855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,2,1,power_law_1.2,1.4468031883239747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,4,1,balanced,0.5892906586329142
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,4,1,balanced,0.5899146795272827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,4,1,power_law_1.01,0.6335552215576172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,4,1,power_law_1.01,0.6364799976348877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,4,1,power_law_1.2,0.661900806427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,4,1,power_law_1.2,0.6787263870239257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,8,1,balanced,0.3475840091705322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,8,1,balanced,0.3480159838994344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,8,1,power_law_1.01,0.3542655944824219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,8,1,power_law_1.01,0.3564863920211792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,8,1,power_law_1.2,0.3613312005996704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2048,8,256,8,1,power_law_1.2,0.36136319637298586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,1,balanced,2.1316426595052085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,1,balanced,2.131744066874186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,1,power_law_1.01,2.316531181335449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,1,power_law_1.01,2.338617515563965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,1,power_law_1.2,2.362387275695801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,1,power_law_1.2,2.408857536315918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,16,balanced,0.32280532519022626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,16,balanced,0.32318933804829914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,16,power_law_1.01,0.3726016044616699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,16,power_law_1.01,0.38135039806365967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,16,power_law_1.2,0.38480000495910643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,16,power_law_1.2,0.3868096113204956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,2,balanced,1.1735946337382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,2,balanced,1.1741866270701091
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,2,power_law_1.01,1.2771903991699218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,2,power_law_1.01,1.3007807731628418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,2,power_law_1.2,1.3052224159240722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,2,power_law_1.2,1.3363519668579102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,32,balanced,0.2573546568552653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,32,balanced,0.25915199518203735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,32,power_law_1.01,0.30090880393981934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,32,power_law_1.01,0.3010879993438721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,32,power_law_1.2,0.31083519458770753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,32,power_law_1.2,0.3206847906112671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,4,balanced,0.6909759839375814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,4,balanced,0.6935466925303141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,4,power_law_1.01,0.743884801864624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,4,power_law_1.01,0.7720128059387207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,4,power_law_1.2,0.7800384044647217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,4,power_law_1.2,0.8056575775146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,8,balanced,0.44651198387145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,8,balanced,0.446613351504008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,8,power_law_1.01,0.4886911869049072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,8,power_law_1.01,0.4910399913787842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,8,power_law_1.2,0.504204797744751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,1,8,power_law_1.2,0.5114687919616699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,2,1,balanced,1.13919997215271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,2,1,balanced,1.1410026550292969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,2,1,power_law_1.01,1.2490176200866698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,2,1,power_law_1.01,1.2512191772460937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,2,1,power_law_1.2,1.2658687591552735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,2,1,power_law_1.2,1.2927871704101563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,4,1,balanced,0.4875466823577881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,4,1,balanced,0.4882986545562744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,4,1,power_law_1.01,0.6315455913543702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,4,1,power_law_1.01,0.6412864208221436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,4,1,power_law_1.2,0.656928014755249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,6144,2560,8,160,4,1,power_law_1.2,0.6580927848815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,1,balanced,3.094282786051432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,1,balanced,3.0959787368774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,1,power_law_1.01,2.9177791595458986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,1,power_law_1.01,2.9425535202026367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,1,power_law_1.2,3.036992073059082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,1,power_law_1.2,3.042176055908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,128,balanced,0.25938133398691815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,128,balanced,0.26156266530354816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,128,power_law_1.01,0.26673920154571534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,128,power_law_1.01,0.26698238849639894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,128,power_law_1.2,0.27256319522857664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,128,power_law_1.2,0.27387518882751466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,16,balanced,0.42083199818929035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,16,balanced,0.42164798577626544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,16,power_law_1.01,0.4353663921356201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,16,power_law_1.01,0.4392384052276611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,16,power_law_1.2,0.45866241455078127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,16,power_law_1.2,0.4587264060974121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,2,balanced,1.6759519577026367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,2,power_law_1.01,1.6251327514648437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,2,power_law_1.01,1.669715118408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,2,power_law_1.2,1.6617855072021483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,2,power_law_1.2,1.6751935958862305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,256,balanced,0.25516800085703534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,256,balanced,0.25521065791447956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,256,power_law_1.01,0.25527679920196533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,256,power_law_1.01,0.2556544065475464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,256,power_law_1.2,0.25899519920349123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,256,power_law_1.2,0.26041600704193113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,32,balanced,0.32822932799657184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,32,balanced,0.328384002049764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,32,power_law_1.01,0.3441087961196899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,32,power_law_1.01,0.34858880043029783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,32,power_law_1.2,0.35952000617980956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,32,power_law_1.2,0.3596352100372314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,4,balanced,0.9662559827168783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,4,balanced,0.966480016708374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,4,power_law_1.01,0.9367424011230469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,4,power_law_1.01,0.9433407783508301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,4,power_law_1.2,0.9752896308898926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,4,power_law_1.2,0.977337646484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,64,balanced,0.2794453303019206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,64,balanced,0.2809866666793823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,64,power_law_1.01,0.289849591255188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,64,power_law_1.01,0.291264009475708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,64,power_law_1.2,0.29780480861663816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,64,power_law_1.2,0.3016000032424927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,8,balanced,0.6023039817810059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,8,balanced,0.6028266747792562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,8,power_law_1.01,0.6113152027130127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,8,power_law_1.01,0.6132224082946778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,8,power_law_1.2,0.6206655979156495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,1,8,power_law_1.2,0.6491968154907226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,16,1,balanced,0.4396053155263265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,16,1,balanced,0.4399786790211995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,16,1,power_law_1.01,0.42335357666015627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,16,1,power_law_1.01,0.42904958724975584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,16,1,power_law_1.2,0.43648638725280764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,16,1,power_law_1.2,0.4376192092895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,2,1,balanced,1.6590827306111653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,2,1,balanced,1.6595892906188965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,2,1,power_law_1.01,1.6018367767333985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,2,1,power_law_1.01,1.616543960571289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,2,1,power_law_1.2,1.6549568176269531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,2,1,power_law_1.2,1.6597183227539063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,4,1,balanced,0.6781973044077555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,4,1,balanced,0.6813386281331381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,4,1,power_law_1.01,0.7339968204498291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,4,1,power_law_1.01,0.7387455940246582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,4,1,power_law_1.2,0.7666175842285157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,4,1,power_law_1.2,0.7771455764770507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,8,1,balanced,0.38170135021209717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,8,1,balanced,0.3886559804280599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,8,1,power_law_1.01,0.4097599983215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,8,1,power_law_1.01,0.4128448009490967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,8,1,power_law_1.2,0.41651201248168945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,256,8,1,power_law_1.2,0.4189631938934326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,1,balanced,4.5403626759847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,1,balanced,4.544143994649251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,1,power_law_1.01,3.7990657806396486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,1,power_law_1.01,3.8536895751953124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,1,power_law_1.2,3.9865150451660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,1,power_law_1.2,4.017926406860352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,128,balanced,0.32208534081776935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,128,balanced,0.3223466674486796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,128,power_law_1.01,0.3214207887649536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,128,power_law_1.01,0.32238719463348386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,128,power_law_1.2,0.33087360858917236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,128,power_law_1.2,0.3310080051422119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,16,balanced,0.562554677327474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,16,balanced,0.5652586619059244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,16,power_law_1.01,0.5374271869659424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,16,power_law_1.01,0.5391104221343994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,16,power_law_1.2,0.5493375778198242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,16,power_law_1.2,0.5549248218536377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,2,balanced,2.4232959747314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,2,balanced,2.4250399271647134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,2,power_law_1.01,2.064959907531738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,2,power_law_1.01,2.0801279067993166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,2,power_law_1.2,2.0817024230957033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,2,power_law_1.2,2.165439987182617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,32,balanced,0.42909332116444904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,32,balanced,0.43053332964579266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,32,power_law_1.01,0.4186367988586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,32,power_law_1.01,0.42423038482666015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,32,power_law_1.2,0.42091522216796873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,32,power_law_1.2,0.42946557998657225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,4,balanced,1.366480032602946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,4,balanced,1.3680960337320964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,4,power_law_1.01,1.2867648124694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,4,power_law_1.01,1.3036864280700684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,4,power_law_1.2,1.2195903778076171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,4,power_law_1.2,1.223731231689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,64,balanced,0.3577173153559367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,64,balanced,0.35865068435668945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,64,power_law_1.01,0.35101439952850344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,64,power_law_1.01,0.35304319858551025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,64,power_law_1.2,0.3635967969894409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,64,power_law_1.2,0.3663680076599121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,8,balanced,0.836837371190389
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,8,balanced,0.8368533452351888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,8,power_law_1.01,0.7396543979644775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,8,power_law_1.01,0.7606143951416016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,8,power_law_1.2,0.7935808181762696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,1,8,power_law_1.2,0.8171008110046387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,16,1,balanced,0.32941333452860516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,16,1,balanced,0.33294399579366046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,16,1,power_law_1.01,0.41338238716125486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,16,1,power_law_1.01,0.414137601852417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,16,1,power_law_1.2,0.41597437858581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,16,1,power_law_1.2,0.41841278076171873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,2,1,balanced,2.418224016825358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,2,1,balanced,2.4228533109029136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,2,1,power_law_1.01,2.0620479583740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,2,1,power_law_1.01,2.1098175048828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,2,1,power_law_1.2,2.1323968887329103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,2,1,power_law_1.2,2.1513343811035157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,4,1,balanced,1.3839680353800456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,4,1,balanced,1.386799971262614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,4,1,power_law_1.01,1.1732799530029296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,4,1,power_law_1.01,1.1964287757873535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,4,1,power_law_1.2,1.197606372833252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,4,1,power_law_1.2,1.2236672401428224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,8,1,balanced,0.5015893379847208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,8,1,balanced,0.5023039976755778
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,8,1,power_law_1.01,0.5203648090362549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,8,1,power_law_1.01,0.5240128040313721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,8,1,power_law_1.2,0.521017599105835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,512,7168,2048,8,384,8,1,power_law_1.2,0.5270336151123047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,1,balanced,1.2725760142008464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,1,balanced,1.2732319831848145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,1,power_law_1.01,1.3110079765319824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,1,power_law_1.01,1.311788845062256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,1,power_law_1.2,1.3085696220397949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,1,power_law_1.2,1.3091135978698731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,128,balanced,0.4818720022837321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,128,balanced,0.48212265968322754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,128,power_law_1.01,0.5286399841308593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,128,power_law_1.01,0.5391295909881592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,128,power_law_1.2,0.5665215969085693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,128,power_law_1.2,0.5731200218200684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,16,balanced,0.5337599913279215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,16,balanced,0.5340746641159058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,16,power_law_1.01,0.5986623764038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,16,power_law_1.01,0.6094399929046631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,16,power_law_1.2,0.6237696170806885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,16,power_law_1.2,0.6386047840118408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,2,balanced,0.9230720202128092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,2,balanced,0.9231999715169271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,2,power_law_1.01,1.008563232421875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,2,power_law_1.01,1.0139455795288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,2,power_law_1.2,0.9974911689758301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,2,power_law_1.2,1.0068032264709472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,32,balanced,0.5027146736780802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,32,balanced,0.5053333441416422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,32,power_law_1.01,0.5754752159118652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,32,power_law_1.01,0.5773888111114502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,32,power_law_1.2,0.5872000217437744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,32,power_law_1.2,0.6108672142028808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,4,balanced,0.6998026371002197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,4,balanced,0.6998773415883383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,4,power_law_1.01,0.7601791858673096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,4,power_law_1.01,0.7779967784881592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,4,power_law_1.2,0.7866496086120606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,4,power_law_1.2,0.8189311981201172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,64,balanced,0.48870400587717694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,64,balanced,0.48982401688893634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,64,power_law_1.01,0.554259204864502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,64,power_law_1.01,0.5572031974792481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,64,power_law_1.2,0.5746367931365967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,64,power_law_1.2,0.5834623813629151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,8,balanced,0.588101347287496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,8,balanced,0.5902400016784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,8,power_law_1.01,0.66211838722229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,8,power_law_1.01,0.6729152202606201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,8,power_law_1.2,0.683513593673706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,1,8,power_law_1.2,0.7027135848999023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,2,1,balanced,0.7864586512247721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,2,1,balanced,0.7873653570810953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,2,1,power_law_1.01,0.8157440185546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,2,1,power_law_1.01,0.8187071800231933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,2,1,power_law_1.2,0.813049602508545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,2048,768,8,128,2,1,power_law_1.2,0.8155008316040039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,1,balanced,3.2947680155436196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,1,balanced,3.2956107457478843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,1,power_law_1.01,3.7010112762451173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,1,power_law_1.01,3.721331024169922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,1,power_law_1.2,3.734630584716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,1,power_law_1.2,3.739411163330078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,128,balanced,0.8048053582509359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,128,balanced,0.8051733175913492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,128,power_law_1.01,0.9048576354980469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,128,power_law_1.01,0.9156415939331055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,128,power_law_1.2,0.9660415649414062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,128,power_law_1.2,0.9702655792236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,16,balanced,0.951861302057902
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,16,power_law_1.01,1.1081855773925782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,16,power_law_1.01,1.1367487907409668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,16,power_law_1.2,1.1765760421752929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,16,power_law_1.2,1.2025471687316895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,2,balanced,2.087813377380371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,2,balanced,2.089615980784098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,2,power_law_1.01,2.3343040466308596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,2,power_law_1.01,2.368044853210449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,2,power_law_1.2,2.3899839401245115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,2,power_law_1.2,2.463692855834961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,256,balanced,0.7950987021128336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,256,balanced,0.7951253255208334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,256,power_law_1.01,0.8602560043334961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,256,power_law_1.01,0.8659263610839844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,256,power_law_1.2,0.9317567825317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,256,power_law_1.2,0.9375103950500489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,32,balanced,0.8690186341603597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,32,balanced,0.8691253662109375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,32,power_law_1.01,0.9883135795593262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,32,power_law_1.01,1.0055551528930664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,32,power_law_1.2,1.07706880569458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,32,power_law_1.2,1.0867903709411622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,4,balanced,1.439509391784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,4,balanced,1.441322644551595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,4,power_law_1.01,1.7111808776855468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,4,power_law_1.01,1.7315008163452148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,4,power_law_1.2,1.7252927780151368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,4,power_law_1.2,1.762726402282715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,64,balanced,0.827338695526123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,64,balanced,0.8285919825236002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,64,power_law_1.01,0.940492820739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,64,power_law_1.01,0.965824031829834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,64,power_law_1.2,0.9812159538269043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,64,power_law_1.2,0.999295997619629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,8,balanced,1.1159520149230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,8,balanced,1.1162559986114502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,8,power_law_1.01,1.2724608421325683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,8,power_law_1.01,1.3142080307006836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,8,power_law_1.2,1.3375935554504395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,1,8,power_law_1.2,1.3511232376098632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,2,1,balanced,1.8848053614298503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,2,1,balanced,1.8849973678588867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,2,1,power_law_1.01,2.089030456542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,2,1,power_law_1.01,2.100480079650879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,2,1,power_law_1.2,2.1030336380004884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,2,1,power_law_1.2,2.1127872467041016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,4,1,balanced,1.1643040180206299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,4,1,balanced,1.1658399899800618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,4,1,power_law_1.01,1.2799296379089355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,4,1,power_law_1.01,1.281043243408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,4,1,power_law_1.2,1.2868288040161133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,3072,1536,8,256,4,1,power_law_1.2,1.2892864227294922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,1,balanced,8.256863911946615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,1,balanced,8.257962544759115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,1,power_law_1.01,8.355347442626954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,1,power_law_1.01,8.369407653808594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,1,power_law_1.2,8.319750213623047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,1,power_law_1.2,8.373542022705077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,2,balanced,4.805055936177571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,2,balanced,4.806581179300944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,2,power_law_1.01,5.936620712280273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,2,power_law_1.01,6.425791931152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,2,power_law_1.2,6.005120086669922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,2,power_law_1.2,6.327967834472656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,4,balanced,3.0615574518839517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,4,balanced,3.065781275431315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,4,power_law_1.01,5.145996856689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,4,power_law_1.01,5.214400100708008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,4,power_law_1.2,5.618310546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,4,power_law_1.2,5.713286590576172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,8,balanced,2.123258590698242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,8,balanced,2.1241706212361655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,8,power_law_1.01,4.645087814331054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,8,power_law_1.01,4.679123306274414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,8,power_law_1.2,4.2277374267578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,1,8,power_law_1.2,4.620691299438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,16,1,balanced,0.6821173032124838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,16,1,balanced,0.6827466487884521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,16,1,power_law_1.01,0.6725247859954834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,16,1,power_law_1.01,0.6837056159973145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,16,1,power_law_1.2,0.6773568153381347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,16,1,power_law_1.2,0.6801023960113526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,2,1,balanced,4.169333457946777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,2,1,balanced,4.17146650950114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,2,1,power_law_1.01,4.153408050537109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,2,1,power_law_1.01,4.182419204711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,2,1,power_law_1.2,4.151833724975586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,2,1,power_law_1.2,4.159110260009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,4,1,balanced,2.167301336924235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,4,1,balanced,2.171973387400309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,4,1,power_law_1.01,2.1511423110961916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,4,1,power_law_1.01,2.1553600311279295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,4,1,power_law_1.2,2.131180763244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,4,1,power_law_1.2,2.1414207458496093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,8,1,balanced,1.1624586582183838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,8,1,balanced,1.1628053188323975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,8,1,power_law_1.01,1.1541631698608399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,8,1,power_law_1.01,1.1568384170532227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,8,1,power_law_1.2,1.1412799835205079
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,14336,2,8,8,1,power_law_1.2,1.1453503608703612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,1,balanced,4.027125358581543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,1,balanced,4.031200091044108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,1,power_law_1.01,4.22081298828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,1,power_law_1.01,4.226675033569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,1,power_law_1.2,4.159161758422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,1,power_law_1.2,4.189209747314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,128,balanced,0.8793013095855713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,128,balanced,0.8811413447062174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,128,power_law_1.01,1.036128044128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,128,power_law_1.01,1.0423232078552247
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,128,power_law_1.2,1.182425594329834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,128,power_law_1.2,1.2017855644226074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,16,balanced,1.0613653659820557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,16,balanced,1.0628373622894287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,16,power_law_1.01,1.315129566192627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,16,power_law_1.01,1.3167360305786133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,16,power_law_1.2,1.3691328048706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,16,power_law_1.2,1.439904022216797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,2,balanced,2.505018711090088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,2,balanced,2.506351947784424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,2,power_law_1.01,2.7591232299804687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,2,power_law_1.01,2.814201545715332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,2,power_law_1.2,2.7780736923217773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,2,power_law_1.2,2.867385673522949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,32,balanced,0.9569599628448486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,32,balanced,0.9607199827829996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,32,power_law_1.01,1.1844799995422364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,32,power_law_1.01,1.1998911857604981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,32,power_law_1.2,1.3093695640563965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,32,power_law_1.2,1.3783616065979003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,4,balanced,1.6825547218322754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,4,balanced,1.6856907208760579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,4,power_law_1.01,1.9649215698242188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,4,power_law_1.01,1.9817920684814454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,4,power_law_1.2,1.9757888793945313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,4,power_law_1.2,2.1422847747802733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,64,balanced,0.9067733287811279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,64,balanced,0.9077119827270508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,64,power_law_1.01,1.0619071960449218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,64,power_law_1.01,1.0829440116882325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,64,power_law_1.2,1.2491776466369628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,64,power_law_1.2,1.2796223640441895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,8,balanced,1.2718133131663005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,8,balanced,1.2728906472524006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,8,power_law_1.01,1.5013824462890626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,8,power_law_1.01,1.6061887741088867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,8,power_law_1.2,1.6531200408935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,1,8,power_law_1.2,1.7661760330200196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,2,1,balanced,2.2580693562825522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,2,1,balanced,2.266042709350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,2,1,power_law_1.01,2.310963249206543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,2,1,power_law_1.01,2.322368049621582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,2,1,power_law_1.2,2.309516716003418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,2,1,power_law_1.2,2.314553642272949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,4,1,balanced,1.404607931772868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,4,1,balanced,1.4047627449035645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,4,1,power_law_1.01,1.455948829650879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,4,1,power_law_1.01,1.4611328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,4,1,power_law_1.2,1.4488639831542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,1536,8,128,4,1,power_law_1.2,1.4527039527893066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,1,balanced,21.56678517659505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,1,balanced,21.569557189941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,1,power_law_1.01,20.494085693359374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,1,power_law_1.01,20.498150634765626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,1,power_law_1.2,20.45729217529297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,1,power_law_1.2,20.50235595703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,128,balanced,3.300352096557617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,128,balanced,3.3036746978759766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,128,power_law_1.01,3.6186431884765624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,128,power_law_1.01,3.724313735961914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,128,power_law_1.2,3.8174591064453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,128,power_law_1.2,3.918636703491211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,16,balanced,4.333461443583171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,16,balanced,4.339605331420898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,16,power_law_1.01,4.730105590820313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,16,power_law_1.01,5.003136062622071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,16,power_law_1.2,4.970150375366211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,16,power_law_1.2,5.180012893676758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,2,balanced,12.52456029256185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,2,balanced,12.525615692138672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,2,power_law_1.01,12.594137573242188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,2,power_law_1.01,12.6797119140625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,2,power_law_1.2,12.537312316894532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,2,power_law_1.2,12.97606964111328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,256,balanced,3.224735895792643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,256,balanced,3.2341814041137695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,256,power_law_1.01,3.4683456420898438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,256,power_law_1.01,3.5154750823974608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,256,power_law_1.2,3.693868637084961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,256,power_law_1.2,3.7397953033447267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,32,balanced,3.742645263671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,32,balanced,3.7445386250813804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,32,power_law_1.01,4.198233413696289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,32,power_law_1.01,4.246796798706055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,32,power_law_1.2,4.3992256164550785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,32,power_law_1.2,4.489484786987305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,4,balanced,7.852389017740886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,4,balanced,7.853765487670898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,4,power_law_1.01,8.09151382446289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,4,power_law_1.01,8.371340942382812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,4,power_law_1.2,8.382355499267579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,4,power_law_1.2,8.474208068847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,64,balanced,3.4472481409708657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,64,balanced,3.461941401163737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,64,power_law_1.01,3.810163116455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,64,power_law_1.01,3.8953536987304687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,64,power_law_1.2,4.02845458984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,64,power_law_1.2,4.202099227905274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,8,balanced,5.513343811035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,8,balanced,5.527946472167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,8,power_law_1.01,5.81275520324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,8,power_law_1.01,6.046131134033203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,8,power_law_1.2,6.282918548583984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,4096,2688,22,512,1,8,power_law_1.2,6.456134033203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,1,balanced,13.434762318929037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,1,balanced,13.43627675374349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,1,power_law_1.01,13.415303039550782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,1,power_law_1.01,13.421830749511718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,1,power_law_1.2,13.31461181640625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,1,power_law_1.2,13.350674438476563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,2,balanced,7.44268798828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,2,balanced,7.447477340698242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,2,power_law_1.01,10.340557098388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,2,power_law_1.01,9.635897827148437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,2,power_law_1.2,10.056121826171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,2,power_law_1.2,10.491065979003906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,4,balanced,4.430074691772461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,4,balanced,4.435162544250488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,4,power_law_1.01,7.555654144287109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,4,power_law_1.01,8.190118408203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,4,power_law_1.2,7.503520202636719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,4,power_law_1.2,7.556082916259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,8,balanced,2.9148693084716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,8,balanced,2.9184532165527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,8,power_law_1.01,6.910829162597656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,8,power_law_1.01,7.224575805664062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,8,power_law_1.2,6.763053131103516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,1,8,power_law_1.2,6.8232063293457035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,16,1,balanced,1.0870400269826253
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,16,1,balanced,1.0875840187072754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,16,1,power_law_1.01,1.059507179260254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,16,1,power_law_1.01,1.061638355255127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,16,1,power_law_1.2,1.056383991241455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,16,1,power_law_1.2,1.0644096374511718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,2,1,balanced,6.7318878173828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,2,1,balanced,6.744368235270183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,2,1,power_law_1.01,6.688179016113281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,2,1,power_law_1.01,6.731858825683593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,2,1,power_law_1.2,6.718412780761719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,2,1,power_law_1.2,6.720928192138672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,32,1,balanced,0.6939893563588461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,32,1,balanced,0.6976640224456787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,32,1,power_law_1.01,0.6788864135742188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,32,1,power_law_1.01,0.6823488235473633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,32,1,power_law_1.2,0.6789055824279785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,32,1,power_law_1.2,0.6908991813659668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,4,1,balanced,3.501925468444824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,4,1,balanced,3.5031038920084634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,4,1,power_law_1.01,3.4924991607666014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,4,1,power_law_1.01,3.4945919036865236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,4,1,power_law_1.2,3.4687873840332033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,4,1,power_law_1.2,3.485753631591797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,8,1,balanced,1.8914027214050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,8,1,balanced,1.8933226267496746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,8,1,power_law_1.01,1.8612672805786132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,8,1,power_law_1.01,1.8719104766845702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,8,1,power_law_1.2,1.8612480163574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,16384,2,8,8,1,power_law_1.2,1.8671039581298827
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,1,balanced,7.72978146870931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,1,balanced,7.737599690755208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,1,power_law_1.01,8.864364624023438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,1,power_law_1.01,8.873772430419923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,1,power_law_1.2,8.973715209960938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,1,power_law_1.2,9.009043121337891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,128,balanced,1.2797013123830159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,128,balanced,1.2837920188903809
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,128,power_law_1.01,1.5272064208984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,128,power_law_1.01,1.5459903717041015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,128,power_law_1.2,1.6591232299804688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,128,power_law_1.2,1.6834495544433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,16,balanced,1.6526400248209636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,16,balanced,1.6601759592692058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,16,power_law_1.01,2.0423871994018556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,16,power_law_1.01,2.096396827697754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,16,power_law_1.2,2.1329792022705076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,16,power_law_1.2,2.3268800735473634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,2,balanced,4.57154655456543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,2,balanced,4.57530148824056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,2,power_law_1.01,5.347046279907227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,2,power_law_1.01,5.550431823730468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,2,power_law_1.2,5.542623901367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,2,power_law_1.2,5.758835220336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,256,balanced,1.2544053395589192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,256,balanced,1.255786657333374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,256,power_law_1.01,1.4462592124938964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,256,power_law_1.01,1.4551168441772462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,256,power_law_1.2,1.5967679977416993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,256,power_law_1.2,1.5977343559265136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,32,balanced,1.442266623179118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,32,balanced,1.443178653717041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,32,power_law_1.01,1.7444927215576171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,32,power_law_1.01,1.7636159896850585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,32,power_law_1.2,1.980659294128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,32,power_law_1.2,1.9849855422973632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,4,balanced,2.9126294453938804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,4,balanced,2.9159412384033203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,4,power_law_1.01,3.4854591369628904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,4,power_law_1.01,3.5425342559814452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,4,power_law_1.2,3.6626815795898438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,4,power_law_1.2,3.9589054107666017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,64,balanced,1.3337279955546062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,64,balanced,1.338314692179362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,64,power_law_1.01,1.6158208847045898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,64,power_law_1.01,1.6465343475341796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,64,power_law_1.2,1.8003263473510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,64,power_law_1.2,1.8112319946289062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,8,balanced,2.0129013061523438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,8,balanced,2.014245351155599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,8,power_law_1.01,2.4703807830810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,8,power_law_1.01,2.472761535644531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,8,power_law_1.2,2.6241472244262694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,1,8,power_law_1.2,2.682521629333496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,16,1,balanced,1.3346400260925293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,16,1,balanced,1.3365707397460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,16,1,power_law_1.01,1.4402688026428223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,16,1,power_law_1.01,1.4422911643981933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,16,1,power_law_1.2,1.445126438140869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,16,1,power_law_1.2,1.4523008346557618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,2,1,balanced,4.266463915506999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,2,1,balanced,4.271317481994629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,2,1,power_law_1.01,4.854668807983399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,2,1,power_law_1.01,4.8558910369873045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,2,1,power_law_1.2,4.871641540527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,2,1,power_law_1.2,4.884979248046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,4,1,balanced,2.474720001220703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,4,1,balanced,2.4747680028279624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,4,1,power_law_1.01,2.785145568847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,4,1,power_law_1.01,2.786092758178711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,4,1,power_law_1.2,2.816806411743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,4,1,power_law_1.2,2.818252754211426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,8,1,balanced,3.3633600870768228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,8,1,balanced,3.366522789001465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,8,1,power_law_1.01,3.564998245239258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,8,1,power_law_1.01,3.5658817291259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,8,1,power_law_1.2,3.5802753448486326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2048,8,256,8,1,power_law_1.2,3.5853950500488283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,1,balanced,9.531930923461914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,1,balanced,9.545183817545572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,1,power_law_1.01,10.065203094482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,1,power_law_1.01,10.075161743164063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,1,power_law_1.2,10.011833953857423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,1,power_law_1.2,10.073983764648437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,16,balanced,1.8670719464619954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,16,balanced,1.8701440493265789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,16,power_law_1.01,2.4166015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,16,power_law_1.01,2.427680015563965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,16,power_law_1.2,2.517190361022949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,16,power_law_1.2,2.783008003234863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,2,balanced,5.530783971150716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,2,balanced,5.530810674031575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,2,power_law_1.01,6.255583953857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,2,power_law_1.01,6.437625885009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,2,power_law_1.2,6.246246337890625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,2,power_law_1.2,6.304806518554687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,32,balanced,1.5959146817525227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,32,balanced,1.597061316172282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,32,power_law_1.01,2.078860855102539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,32,power_law_1.01,2.126515197753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,32,power_law_1.2,2.267206382751465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,32,power_law_1.2,2.3537216186523438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,4,balanced,3.347562789916992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,4,balanced,3.34931214650472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,4,power_law_1.01,3.9384193420410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,4,power_law_1.01,4.034553527832031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,4,power_law_1.2,3.992812728881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,4,power_law_1.2,4.225964736938477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,8,balanced,2.3401974042256675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,8,balanced,2.3404480616251626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,8,power_law_1.01,2.881657600402832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,8,power_law_1.01,2.958451271057129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,8,power_law_1.2,3.053049659729004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,1,8,power_law_1.2,3.2418239593505858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,2,1,balanced,5.195573488871257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,2,1,balanced,5.196330706278483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,2,1,power_law_1.01,5.4264575958251955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,2,1,power_law_1.01,5.448992156982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,2,1,power_law_1.2,5.38397445678711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,2,1,power_law_1.2,5.408691024780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,4,1,balanced,2.9696105321248374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,4,1,balanced,2.972544034322103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,4,1,power_law_1.01,3.0212991714477537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,4,1,power_law_1.01,3.0381696701049803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,4,1,power_law_1.2,3.013030433654785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,6144,2560,8,160,4,1,power_law_1.2,3.025062370300293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,1,balanced,8.912405649820963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,1,balanced,8.915557225545248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,1,power_law_1.01,10.259136199951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,1,power_law_1.01,10.28572769165039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,1,power_law_1.2,10.377401733398438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,1,power_law_1.2,10.421126556396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,128,balanced,1.3869706789652507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,128,balanced,1.3909707069396973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,128,power_law_1.01,1.6283456802368164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,128,power_law_1.01,1.6574527740478515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,128,power_law_1.2,1.813382339477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,128,power_law_1.2,1.8438911437988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,16,balanced,1.8254613876342773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,16,balanced,1.826757272084554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,16,power_law_1.01,2.234623908996582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,16,power_law_1.01,2.258790397644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,16,power_law_1.2,2.4388608932495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,16,power_law_1.2,2.628416061401367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,2,balanced,5.22925345102946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,2,balanced,5.236293474833171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,2,power_law_1.01,6.0908161163330075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,2,power_law_1.01,6.1647998809814455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,2,power_law_1.2,6.219449615478515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,2,power_law_1.2,6.338399887084961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,256,balanced,1.3572319348653157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,256,balanced,1.3607734044392903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,256,power_law_1.01,1.576531219482422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,256,power_law_1.01,1.616966438293457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,256,power_law_1.2,1.790297508239746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,256,power_law_1.2,1.7928192138671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,32,balanced,1.577605406443278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,32,balanced,1.5785600344340007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,32,power_law_1.01,1.9765119552612305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,32,power_law_1.01,1.9999040603637694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,32,power_law_1.2,2.1905792236328123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,32,power_law_1.2,2.204217529296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,4,balanced,3.288895924886068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,4,balanced,3.292405446370443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,4,power_law_1.01,3.9934017181396486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,4,power_law_1.01,4.09681282043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,4,power_law_1.2,4.344800186157227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,4,power_law_1.2,4.395603179931641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,64,balanced,1.4527360598246257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,64,balanced,1.4571839968363445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,64,power_law_1.01,1.7939071655273438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,64,power_law_1.01,1.8306751251220703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,64,power_law_1.2,1.9713407516479493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,64,power_law_1.2,2.0038848876953126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,8,balanced,2.2359946568806968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,8,balanced,2.238272031148275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,8,power_law_1.01,2.7940223693847654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,8,power_law_1.01,2.841708755493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,8,power_law_1.2,3.073740768432617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,1,8,power_law_1.2,3.2050945281982424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,16,1,balanced,1.538922627766927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,16,1,balanced,1.539669354756673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,16,1,power_law_1.01,1.6607488632202148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,16,1,power_law_1.01,1.6619199752807616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,16,1,power_law_1.2,1.664896011352539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,16,1,power_law_1.2,1.6674688339233399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,2,1,balanced,4.932554562886556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,2,1,balanced,4.937040011088054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,2,1,power_law_1.01,5.6226238250732425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,2,1,power_law_1.01,5.63267822265625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,2,1,power_law_1.2,5.645619201660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,2,1,power_law_1.2,5.653228759765625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,4,1,balanced,2.8361600240071616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,4,1,balanced,2.836432139078776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,4,1,power_law_1.01,3.2115966796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,4,1,power_law_1.01,3.2168960571289062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,4,1,power_law_1.2,3.241068649291992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,4,1,power_law_1.2,3.2532543182373046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,8,1,balanced,3.903648058573405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,8,1,balanced,3.907642682393392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,8,1,power_law_1.01,4.151756668090821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,8,1,power_law_1.01,4.154950332641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,8,1,power_law_1.2,4.151968002319336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,256,8,1,power_law_1.2,4.157779312133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,1,balanced,9.190661112467447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,1,balanced,9.193573633829752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,1,power_law_1.01,11.221177673339843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,1,power_law_1.01,11.223538970947265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,1,power_law_1.2,11.553119659423828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,1,power_law_1.2,11.57729263305664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,128,balanced,1.4460639953613281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,128,balanced,1.4468266169230144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,128,power_law_1.01,1.68035831451416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,128,power_law_1.01,1.7053312301635741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,128,power_law_1.2,1.7698623657226562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,128,power_law_1.2,1.8668415069580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,16,balanced,1.8947839736938477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,16,balanced,1.8978187243143718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,16,power_law_1.01,2.3116479873657227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,16,power_law_1.01,2.3385408401489256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,16,power_law_1.2,2.371379280090332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,16,power_law_1.2,2.570867156982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,2,balanced,5.397194544474284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,2,balanced,5.399685541788737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,2,power_law_1.01,6.640179443359375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,2,power_law_1.01,6.810643005371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,2,power_law_1.2,7.059014129638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,2,power_law_1.2,7.059059143066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,32,balanced,1.6416106224060059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,32,balanced,1.644368012746175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,32,power_law_1.01,2.0122432708740234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,32,power_law_1.01,2.0308095932006838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,32,power_law_1.2,2.084671974182129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,32,power_law_1.2,2.1862016677856446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,4,balanced,3.3974345525105796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,4,balanced,3.406266530354818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,4,power_law_1.01,4.212575912475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,4,power_law_1.01,4.2680000305175785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,4,power_law_1.2,4.428012847900391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,4,power_law_1.2,4.510348892211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,64,balanced,1.5108960469563801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,64,balanced,1.5145492553710938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,64,power_law_1.01,1.7822912216186524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,64,power_law_1.01,1.7921279907226562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,64,power_law_1.2,1.9608448028564454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,64,power_law_1.2,2.0182464599609373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,8,balanced,2.3978880246480307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,8,balanced,2.399376074473063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,8,power_law_1.01,2.997222328186035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,8,power_law_1.01,3.010553550720215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,8,power_law_1.2,3.1748607635498045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,1,8,power_law_1.2,3.2793983459472655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,16,1,balanced,1.7763627370198567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,16,1,balanced,1.7774559656778972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,16,1,power_law_1.01,1.9293376922607421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,16,1,power_law_1.01,1.9326143264770508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,16,1,power_law_1.2,1.9624191284179688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,16,1,power_law_1.2,1.971219253540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,2,1,balanced,5.082858721415202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,2,1,balanced,5.085386594136556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,2,1,power_law_1.01,6.134527969360351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,2,1,power_law_1.01,6.182534408569336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,2,1,power_law_1.2,6.287871932983398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,2,1,power_law_1.2,6.342796707153321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,4,1,balanced,3.0483039220174155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,4,1,balanced,3.053701400756836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,4,1,power_law_1.01,3.6066558837890623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,4,1,power_law_1.01,3.6197566986083984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,4,1,power_law_1.2,3.692006301879883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,4,1,power_law_1.2,3.700908660888672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,8,1,balanced,2.032965342203776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,8,1,balanced,2.035535971323649
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,8,1,power_law_1.01,2.331385612487793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,8,1,power_law_1.01,2.3454208374023438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,8,1,power_law_1.2,2.400422477722168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,6144,7168,2048,8,384,8,1,power_law_1.2,2.4004287719726562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,1,balanced,0.14153066277503967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,1,balanced,0.1420799990495046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,1,power_law_1.01,0.1329408049583435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,1,power_law_1.01,0.13523839712142943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,1,power_law_1.2,0.1359295964241028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,1,power_law_1.2,0.13648639917373656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,128,balanced,0.0394400010506312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,128,balanced,0.04160533348719279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,128,power_law_1.01,0.03870719969272614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,128,power_law_1.01,0.03880960047245026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,128,power_law_1.2,0.03866879940032959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,128,power_law_1.2,0.03895680010318756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,16,balanced,0.043525333205858864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,16,balanced,0.04401599864164988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,16,power_law_1.01,0.04239999949932098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,16,power_law_1.01,0.04266240000724793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,16,power_law_1.2,0.04227199852466583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,16,power_law_1.2,0.04293760061264038
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,2,balanced,0.09688533345858256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,2,balanced,0.09876799583435059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,2,power_law_1.01,0.09217919707298279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,2,power_law_1.01,0.0930624008178711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,2,power_law_1.2,0.09313920140266418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,2,power_law_1.2,0.0936959981918335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,32,balanced,0.03982399900754293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,32,balanced,0.041797334949175514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,32,power_law_1.01,0.038848000764846805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,32,power_law_1.01,0.03966720104217529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,32,power_law_1.2,0.039340800046920775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,32,power_law_1.2,0.039417600631713866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,4,balanced,0.06559466818968455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,4,balanced,0.0661653329928716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,4,power_law_1.01,0.06261759996414185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,4,power_law_1.01,0.06289920210838318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,4,power_law_1.2,0.062041598558425906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,4,power_law_1.2,0.06281599998474122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,64,balanced,0.03944533318281174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,64,balanced,0.03984533250331879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,64,power_law_1.01,0.03866879940032959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,64,power_law_1.01,0.0387584000825882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,64,power_law_1.2,0.03883520066738129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,64,power_law_1.2,0.038848000764846805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,8,balanced,0.0554666668176651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,8,balanced,0.05619733532269796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,8,power_law_1.01,0.05000320076942444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,8,power_law_1.01,0.05238400101661682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,8,power_law_1.2,0.052774399518966675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,1,8,power_law_1.2,0.05286399722099304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,2,1,balanced,0.09974933664004008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,2,1,balanced,0.10051733255386353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,2,1,power_law_1.01,0.09123839735984803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,2,1,power_law_1.01,0.09404799938201905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,2,1,power_law_1.2,0.09349120259284974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,2048,768,8,128,2,1,power_law_1.2,0.09499520063400269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,1,balanced,0.6206186612447103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,1,balanced,0.6207679907480875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,1,power_law_1.01,0.47655677795410156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,1,power_law_1.01,0.47817602157592776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,1,power_law_1.2,0.465715217590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,1,power_law_1.2,0.47655038833618163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,128,balanced,0.05380799869696299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,128,balanced,0.055861334005991616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,128,power_law_1.01,0.0520576000213623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,128,power_law_1.01,0.05245440006256104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,128,power_law_1.2,0.05235199928283692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,128,power_law_1.2,0.0525056004524231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,16,balanced,0.08235733211040497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,16,balanced,0.08237866560618083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,16,power_law_1.01,0.07651839852333069
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,16,power_law_1.01,0.07820159792900086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,16,power_law_1.2,0.07614719867706299
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,16,power_law_1.2,0.07697280049324036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,2,balanced,0.3421333233515422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,2,balanced,0.34700266520182294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,2,power_law_1.01,0.2783679962158203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,2,power_law_1.01,0.28659839630126954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,2,power_law_1.2,0.26103041172027586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,2,power_law_1.2,0.2911936044692993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,256,balanced,0.05154666801293691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,256,balanced,0.05208533505598704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,256,power_law_1.01,0.0507968008518219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,256,power_law_1.01,0.05085440278053284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,256,power_law_1.2,0.05111680030822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,256,power_law_1.2,0.05200639963150024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,32,balanced,0.07214933137098949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,32,balanced,0.07331199944019318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,32,power_law_1.01,0.06481279730796814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,32,power_law_1.01,0.06936960220336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,32,power_law_1.2,0.06704000234603882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,32,power_law_1.2,0.06877440214157104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,4,balanced,0.19549334049224854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,4,balanced,0.19584532578786215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,4,power_law_1.01,0.16762239933013917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,4,power_law_1.01,0.1843840003013611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,4,power_law_1.2,0.15711359977722167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,4,power_law_1.2,0.1751871943473816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,64,balanced,0.059061333537101746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,64,balanced,0.059749335050582886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,64,power_law_1.01,0.057004797458648684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,64,power_law_1.01,0.05736320018768311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,64,power_law_1.2,0.05588480234146118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,64,power_law_1.2,0.057081598043441775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,8,balanced,0.12916266918182373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,8,balanced,0.13077333569526672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,8,power_law_1.01,0.11626240015029907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,8,power_law_1.01,0.11782399415969849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,8,power_law_1.2,0.10974080562591552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,1,8,power_law_1.2,0.11793919801712036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,2,1,balanced,0.3369866609573364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,2,1,balanced,0.3373440106709798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,2,1,power_law_1.01,0.2635456085205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,2,1,power_law_1.01,0.2663104057312012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,2,1,power_law_1.2,0.25770881175994875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,2,1,power_law_1.2,0.2612031936645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,4,1,balanced,0.2058346668879191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,4,1,balanced,0.20587199926376343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,4,1,power_law_1.01,0.16261759996414185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,4,1,power_law_1.01,0.16319359540939332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,4,1,power_law_1.2,0.16128640174865722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,3072,1536,8,256,4,1,power_law_1.2,0.1619328022003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,1,balanced,0.30532799164454144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,1,balanced,0.309168001015981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,1,power_law_1.01,0.33350400924682616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,1,power_law_1.01,0.3355135917663574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,1,power_law_1.2,0.33511040210723875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,1,power_law_1.2,0.3362943887710571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,2,balanced,0.20887466271718344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,2,balanced,0.21462933222452799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,2,power_law_1.01,0.23664638996124268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,2,power_law_1.01,0.2564800024032593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,2,power_law_1.2,0.23790719509124755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,2,power_law_1.2,0.2513344049453735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,4,balanced,0.16195199886957803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,4,balanced,0.16265066464742026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,4,power_law_1.01,0.19414399862289428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,4,power_law_1.01,0.20286719799041747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,4,power_law_1.2,0.19533439874649047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,4,power_law_1.2,0.21013119220733642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,8,balanced,0.1514026621977488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,8,balanced,0.15185067057609558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,8,power_law_1.01,0.16733440160751342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,8,power_law_1.01,0.17063679695129394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,8,power_law_1.2,0.17085440158843995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,1,8,power_law_1.2,0.17339520454406737
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,16,1,balanced,0.05382933219273885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,16,1,balanced,0.05407466491063436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,16,1,power_law_1.01,0.054201602935791016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,16,1,power_law_1.01,0.05432320237159729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,16,1,power_law_1.2,0.05586559772491455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,16,1,power_law_1.2,0.057062399387359616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,2,1,balanced,0.17018665870030722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,2,1,balanced,0.17063466707865396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,2,1,power_law_1.01,0.18849920034408568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,2,1,power_law_1.01,0.1887295961380005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,2,1,power_law_1.2,0.18928639888763427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,2,1,power_law_1.2,0.19054720401763917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,4,1,balanced,0.09970133503278096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,4,1,balanced,0.10227732857068379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,4,1,power_law_1.01,0.11687040328979492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,4,1,power_law_1.01,0.11706240177154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,4,1,power_law_1.2,0.11655679941177369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,4,1,power_law_1.2,0.11667840480804444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,8,1,balanced,0.07205866773923238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,8,1,balanced,0.07246933380762736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,8,1,power_law_1.01,0.07530879974365234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,8,1,power_law_1.01,0.07612800002098083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,8,1,power_law_1.2,0.07592960000038147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,14336,2,8,8,1,power_law_1.2,0.07652480006217957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,1,balanced,0.4312533140182495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,1,balanced,0.43251200517018634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,1,power_law_1.01,0.3827455997467041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,1,power_law_1.01,0.38718719482421876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,1,power_law_1.2,0.4042623996734619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,1,power_law_1.2,0.4070847988128662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,128,balanced,0.05575466652711233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,128,balanced,0.05741333464781443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,128,power_law_1.01,0.05560320019721985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,128,power_law_1.01,0.0568448007106781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,128,power_law_1.2,0.058220797777175905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,128,power_law_1.2,0.05863680243492127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,16,balanced,0.08171733220418294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,16,balanced,0.08196266492207845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,16,power_law_1.01,0.07863680124282837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,16,power_law_1.01,0.07991679906845092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,16,power_law_1.2,0.08088319897651672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,16,power_law_1.2,0.08261759877204895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,2,balanced,0.24553066492080688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,2,balanced,0.2465546727180481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,2,power_law_1.01,0.2279871940612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,2,power_law_1.01,0.23475840091705322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,2,power_law_1.2,0.23399679660797118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,2,power_law_1.2,0.2392512083053589
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,32,balanced,0.06737599770228068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,32,balanced,0.0706826647122701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,32,power_law_1.01,0.06637439727783204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,32,power_law_1.01,0.06659200191497802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,32,power_law_1.2,0.06624000072479248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,32,power_law_1.2,0.06997759938240052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,4,balanced,0.15403200189272562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,4,balanced,0.15822399655977884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,4,power_law_1.01,0.14594559669494628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,4,power_law_1.01,0.15287679433822632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,4,power_law_1.2,0.14538880586624145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,4,power_law_1.2,0.152128005027771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,64,balanced,0.0584746648867925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,64,balanced,0.06055466830730438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,64,power_law_1.01,0.05775359869003296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,64,power_law_1.01,0.05829120278358459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,64,power_law_1.2,0.062003201246261595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,64,power_law_1.2,0.06318719983100891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,8,balanced,0.0940106709798177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,8,balanced,0.09522133072217305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,8,power_law_1.01,0.0908415973186493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,8,power_law_1.01,0.09118080139160156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,8,power_law_1.2,0.08894079923629761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,1,8,power_law_1.2,0.09134079813957215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,2,1,balanced,0.24037333329518637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,2,1,balanced,0.24232532580693564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,2,1,power_law_1.01,0.22652800083160402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,2,1,power_law_1.01,0.22657279968261718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,2,1,power_law_1.2,0.22597761154174806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,2,1,power_law_1.2,0.22818560600280763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,4,1,balanced,0.15990933775901794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,4,1,balanced,0.16146666804949442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,4,1,power_law_1.01,0.15058560371398927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,4,1,power_law_1.01,0.15088000297546386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,4,1,power_law_1.2,0.15237760543823242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,1536,8,128,4,1,power_law_1.2,0.15239039659500123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,1,balanced,2.7681760787963867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,1,balanced,2.771162668863932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,1,power_law_1.01,2.2485376358032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,1,power_law_1.01,2.249062347412109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,1,power_law_1.2,2.255308723449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,1,power_law_1.2,2.2609472274780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,128,balanced,0.10466133554776509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,128,balanced,0.10523733496665955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,128,power_law_1.01,0.1012992024421692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,128,power_law_1.01,0.10371199846267701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,128,power_law_1.2,0.10187519788742065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,128,power_law_1.2,0.10448000431060792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,16,balanced,0.2537066737810771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,16,balanced,0.2558506727218628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,16,power_law_1.01,0.22232959270477295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,16,power_law_1.01,0.23180160522460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,16,power_law_1.2,0.21542398929595946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,16,power_law_1.2,0.22593278884887696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,2,balanced,1.4036906560262044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,2,balanced,1.4048266410827637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,2,power_law_1.01,1.1867136001586913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,2,power_law_1.01,1.2163200378417969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,2,power_law_1.2,1.1818047523498536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,2,power_law_1.2,1.2041343688964843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,256,balanced,0.09264533718427022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,256,balanced,0.09715732932090759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,256,power_law_1.01,0.09128320217132568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,256,power_law_1.01,0.09267839789390564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,256,power_law_1.2,0.09146239757537841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,256,power_law_1.2,0.09435520172119141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,32,balanced,0.16766399145126343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,32,balanced,0.17137600978215536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,32,power_law_1.01,0.15391360521316527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,32,power_law_1.01,0.15714559555053711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,32,power_law_1.2,0.15449600219726561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,32,power_law_1.2,0.1561792016029358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,4,balanced,0.7454186280568441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,4,balanced,0.7475093205769857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,4,power_law_1.01,0.6335872173309326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,4,power_law_1.01,0.6510784149169921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,4,power_law_1.2,0.6304831981658936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,4,power_law_1.2,0.6464704036712646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,64,balanced,0.11672533551851909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,64,balanced,0.11756267150243123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,64,power_law_1.01,0.11226880550384521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,64,power_law_1.01,0.11484800577163697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,64,power_law_1.2,0.11269760131835938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,64,power_law_1.2,0.1134335994720459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,8,balanced,0.41307199001312256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,8,balanced,0.41325334707895917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,8,power_law_1.01,0.35226879119873045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,8,power_law_1.01,0.39755520820617674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,8,power_law_1.2,0.36097919940948486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,4096,2688,22,512,1,8,power_law_1.2,0.3616192102432251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,1,balanced,0.4671413501103719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,1,balanced,0.46927467981974286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,1,power_law_1.01,0.5296127796173096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,1,power_law_1.01,0.5392767906188964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,1,power_law_1.2,0.49103360176086425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,1,power_law_1.2,0.5234496116638183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,2,balanced,0.3179253339767456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,2,balanced,0.3218986590703328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,2,power_law_1.01,0.34922239780426023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,2,power_law_1.01,0.36034560203552246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,2,power_law_1.2,0.34875519275665284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,2,power_law_1.2,0.3554752111434937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,4,balanced,0.21690666675567627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,4,balanced,0.22049599885940552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,4,power_law_1.01,0.28194561004638674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,4,power_law_1.01,0.3033792018890381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,4,power_law_1.2,0.28552320003509524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,4,power_law_1.2,0.30264959335327146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,8,balanced,0.19174933433532715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,8,balanced,0.19338132937749228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,8,power_law_1.01,0.2265023946762085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,8,power_law_1.01,0.25776000022888185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,8,power_law_1.2,0.23197441101074218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,1,8,power_law_1.2,0.2416896104812622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,16,1,balanced,0.07467733323574066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,16,1,balanced,0.07506133119265239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,16,1,power_law_1.01,0.07649279832839966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,16,1,power_law_1.01,0.07694079875946044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,16,1,power_law_1.2,0.07482879757881164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,16,1,power_law_1.2,0.07822719812393189
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,2,1,balanced,0.24807467063268027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,2,1,balanced,0.2510880033175151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,2,1,power_law_1.01,0.2771392107009888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,2,1,power_law_1.01,0.2911168098449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,2,1,power_law_1.2,0.27498879432678225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,2,1,power_law_1.2,0.28743040561676025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,32,1,balanced,0.05952000121275584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,32,1,balanced,0.062128002444903054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,32,1,power_law_1.01,0.060115200281143186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,32,1,power_law_1.01,0.061887997388839724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,32,1,power_law_1.2,0.060755199193954466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,32,1,power_law_1.2,0.0611840009689331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,4,1,balanced,0.14152533809343973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,4,1,balanced,0.15152532855669656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,4,1,power_law_1.01,0.16590720415115356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,4,1,power_law_1.01,0.17072000503540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,4,1,power_law_1.2,0.17412480115890502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,4,1,power_law_1.2,0.17534079551696777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,8,1,balanced,0.09491200248400371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,8,1,balanced,0.09650666515032451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,8,1,power_law_1.01,0.10517760515213012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,8,1,power_law_1.01,0.10521600246429444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,8,1,power_law_1.2,0.1041599988937378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,16384,2,8,8,1,power_law_1.2,0.10590720176696777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,1,balanced,1.5669600168863933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,1,balanced,1.5760639508565266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,1,power_law_1.01,1.193619155883789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,1,power_law_1.01,1.2553919792175292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,1,power_law_1.2,1.1629631996154786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,1,power_law_1.2,1.1984319686889648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,128,balanced,0.08443199594815572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,128,balanced,0.08448533217112224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,128,power_law_1.01,0.08567039966583252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,128,power_law_1.01,0.08599039912223816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,128,power_law_1.2,0.08036479949951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,128,power_law_1.2,0.08140159845352173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,16,balanced,0.15213867028554282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,16,balanced,0.1525706648826599
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,16,power_law_1.01,0.1410048007965088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,16,power_law_1.01,0.1410688042640686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,16,power_law_1.2,0.1380031943321228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,16,power_law_1.2,0.1453760027885437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,2,balanced,0.8172533512115479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,2,balanced,0.8191200097401937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,2,power_law_1.01,0.6595392227172852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,2,power_law_1.01,0.6903168201446533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,2,power_law_1.2,0.663481616973877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,2,power_law_1.2,0.674067211151123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,256,balanced,0.07380799949169159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,256,balanced,0.07481066882610321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,256,power_law_1.01,0.0720255970954895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,256,power_law_1.01,0.07494400143623352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,256,power_law_1.2,0.07160320281982421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,256,power_law_1.2,0.07311360239982605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,32,balanced,0.11024533708890279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,32,balanced,0.11152533690134685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,32,power_law_1.01,0.1044927954673767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,32,power_law_1.01,0.10543999671936036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,32,power_law_1.2,0.1029695987701416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,32,power_law_1.2,0.10401920080184937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,4,balanced,0.4488106568654378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,4,balanced,0.44992534319559735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,4,power_law_1.01,0.36620159149169923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,4,power_law_1.01,0.37939839363098143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,4,power_law_1.2,0.355948805809021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,4,power_law_1.2,0.37944319248199465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,64,balanced,0.09513066212336223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,64,balanced,0.09770133097966512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,64,power_law_1.01,0.08944640159606934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,64,power_law_1.01,0.09255040287971497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,64,power_law_1.2,0.09433599710464477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,64,power_law_1.2,0.09590399861335755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,8,balanced,0.24810133377710977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,8,balanced,0.24888000885645548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,8,power_law_1.01,0.23582079410552978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,8,power_law_1.01,0.24175360202789306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,8,power_law_1.2,0.22990078926086427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,1,8,power_law_1.2,0.23264639377593993
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,16,1,balanced,0.1816906730333964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,16,1,balanced,0.1822133262952169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,16,1,power_law_1.01,0.14829440116882325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,16,1,power_law_1.01,0.14933120012283324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,16,1,power_law_1.2,0.14588160514831544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,16,1,power_law_1.2,0.14895360469818114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,2,1,balanced,0.8053812980651855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,2,1,balanced,0.8092532952626547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,2,1,power_law_1.01,0.62325119972229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,2,1,power_law_1.01,0.6308544158935547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,2,1,power_law_1.2,0.6072319984436035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,2,1,power_law_1.2,0.6253952026367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,4,1,balanced,0.45469868183135986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,4,1,balanced,0.45828266938527423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,4,1,power_law_1.01,0.3461440086364746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,4,1,power_law_1.01,0.35507841110229493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,4,1,power_law_1.2,0.34897279739379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,4,1,power_law_1.2,0.36126079559326174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,8,1,balanced,0.30524800221125287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,8,1,balanced,0.31354133288065594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,8,1,power_law_1.01,0.21872639656066895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,8,1,power_law_1.01,0.22087039947509765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,8,1,power_law_1.2,0.21717119216918945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2048,8,256,8,1,power_law_1.2,0.21921920776367188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,1,balanced,1.2438720067342122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,1,balanced,1.2492160002390544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,1,power_law_1.01,1.0686400413513184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,1,power_law_1.01,1.0706944465637207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,1,power_law_1.2,1.0628735542297363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,1,power_law_1.2,1.1086336135864259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,16,balanced,0.12748799721399942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,16,balanced,0.12880000472068787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,16,power_law_1.01,0.12360320091247559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,16,power_law_1.01,0.12540160417556762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,16,power_law_1.2,0.12091519832611083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,16,power_law_1.2,0.12338559627532959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,2,balanced,0.6635946830113729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,2,balanced,0.6663839817047119
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,2,power_law_1.01,0.5678207874298096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,2,power_law_1.01,0.5787136077880859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,2,power_law_1.2,0.5884031772613525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,2,power_law_1.2,0.5966527938842774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,32,balanced,0.1113813320795695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,32,balanced,0.11152533690134685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,32,power_law_1.01,0.1059648036956787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,32,power_law_1.01,0.10725120306015015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,32,power_law_1.2,0.10583679676055908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,32,power_law_1.2,0.1085312008857727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,4,balanced,0.36424001057942706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,4,balanced,0.3646453221638997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,4,power_law_1.01,0.3290623903274536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,4,power_law_1.01,0.33724160194396974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,4,power_law_1.2,0.3214591979980469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,4,power_law_1.2,0.3324160099029541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,8,balanced,0.2450986703236898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,8,balanced,0.24516799052556357
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,8,power_law_1.01,0.22546560764312745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,8,power_law_1.01,0.23066239356994628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,8,power_law_1.2,0.22076799869537353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,1,8,power_law_1.2,0.22935678958892822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,2,1,balanced,0.6579733292261759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,2,1,balanced,0.6583946545918783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,2,1,power_law_1.01,0.5595967769622803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,2,1,power_law_1.01,0.5697728157043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,2,1,power_law_1.2,0.5691264152526856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,2,1,power_law_1.2,0.5731647968292236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,4,1,balanced,0.35892268021901447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,4,1,balanced,0.35955198605855304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,4,1,power_law_1.01,0.3229952096939087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,4,1,power_law_1.01,0.3286207914352417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,4,1,power_law_1.2,0.32357120513916016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,6144,2560,8,160,4,1,power_law_1.2,0.33131520748138427
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,1,balanced,1.830933411916097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,1,balanced,1.8508480389912922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,1,power_law_1.01,1.3999744415283204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,1,power_law_1.01,1.4142720222473144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,1,power_law_1.2,1.3849535942077638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,1,power_law_1.2,1.3999168395996093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,128,balanced,0.09136000275611877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,128,balanced,0.09682666261990865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,128,power_law_1.01,0.08634880185127258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,128,power_law_1.01,0.09258880019187928
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,128,power_law_1.2,0.09191039800643921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,128,power_law_1.2,0.09422079920768738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,16,balanced,0.16746666034062704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,16,balanced,0.1679733395576477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,16,power_law_1.01,0.15470720529556276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,16,power_law_1.01,0.1570688009262085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,16,power_law_1.2,0.15671679973602295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,16,power_law_1.2,0.15733120441436768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,2,balanced,0.9508480230967203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,2,balanced,0.9528640111287435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,2,power_law_1.01,0.7415103912353516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,2,power_law_1.01,0.7748095989227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,2,power_law_1.2,0.7597631931304931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,2,power_law_1.2,0.7650368213653564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,256,balanced,0.07902400195598602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,256,balanced,0.08482133348782857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,256,power_law_1.01,0.07690240144729614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,256,power_law_1.01,0.08136320114135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,256,power_law_1.2,0.07857919931411743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,256,power_law_1.2,0.07982720136642456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,32,balanced,0.12501333157221475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,32,balanced,0.12574932972590128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,32,power_law_1.01,0.11918720006942748
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,32,power_law_1.01,0.12050559520721435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,32,power_law_1.2,0.12098560333251954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,32,power_law_1.2,0.12121599912643433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,4,balanced,0.5162026484807333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,4,balanced,0.5167040030161539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,4,power_law_1.01,0.4199359893798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,4,power_law_1.01,0.47124481201171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,4,power_law_1.2,0.41947522163391116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,4,power_law_1.2,0.44197759628295896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,64,balanced,0.10501866539319356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,64,balanced,0.10925867160161336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,64,power_law_1.01,0.1021183967590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,64,power_law_1.01,0.10727039575576783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,64,power_law_1.2,0.10414079427719117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,64,power_law_1.2,0.10487680435180664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,8,balanced,0.2866026759147644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,8,balanced,0.288485328356425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,8,power_law_1.01,0.2636415958404541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,8,power_law_1.01,0.26419839859008787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,8,power_law_1.2,0.24344959259033203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,1,8,power_law_1.2,0.2573568105697632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,16,1,balanced,0.2076693375905355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,16,1,balanced,0.20807466904322305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,16,1,power_law_1.01,0.16648319959640503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,16,1,power_law_1.01,0.16876159906387328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,16,1,power_law_1.2,0.16441600322723388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,16,1,power_law_1.2,0.16512000560760498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,2,1,balanced,0.9532639980316162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,2,1,balanced,0.9549226760864258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,2,1,power_law_1.01,0.7379839897155762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,2,1,power_law_1.01,0.7493504047393799
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,2,1,power_law_1.2,0.7139711856842041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,2,1,power_law_1.2,0.7525568008422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,4,1,balanced,0.5290079911549886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,4,1,balanced,0.5292693376541138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,4,1,power_law_1.01,0.406009578704834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,4,1,power_law_1.01,0.4157567977905273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,4,1,power_law_1.2,0.40490241050720216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,4,1,power_law_1.2,0.40840959548950195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,8,1,balanced,0.33980266253153485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,8,1,balanced,0.34095998605092365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,8,1,power_law_1.01,0.24574720859527588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,8,1,power_law_1.01,0.25365118980407714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,8,1,power_law_1.2,0.24759039878845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,256,8,1,power_law_1.2,0.2487231969833374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,1,balanced,2.7143093744913735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,1,balanced,2.7508532206217446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,1,power_law_1.01,1.8243711471557618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,1,power_law_1.01,1.8458240509033204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,1,power_law_1.2,1.749830436706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,1,power_law_1.2,1.7835071563720704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,128,balanced,0.09996267159779866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,128,balanced,0.10199466347694397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,128,power_law_1.01,0.0991104006767273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,128,power_law_1.01,0.10165120363235473
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,128,power_law_1.2,0.10077439546585083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,128,power_law_1.2,0.10459519624710083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,16,balanced,0.2508959968884786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,16,balanced,0.255568007628123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,16,power_law_1.01,0.21827199459075927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,16,power_law_1.01,0.22236158847808837
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,16,power_law_1.2,0.18757760524749756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,16,power_law_1.2,0.2106112003326416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,2,balanced,1.3934027353922527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,2,balanced,1.3947200775146484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,2,power_law_1.01,0.9851584434509277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,2,power_law_1.01,1.0570624351501465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,2,power_law_1.2,0.9465727806091309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,2,power_law_1.2,0.9836223602294922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,32,balanced,0.14866666992505392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,32,balanced,0.14962666233380637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,32,power_law_1.01,0.1338368058204651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,32,power_law_1.01,0.13700480461120607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,32,power_law_1.2,0.13475199937820434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,32,power_law_1.2,0.13944319486618043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,4,balanced,0.7395626703898112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,4,balanced,0.7397226492563883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,4,power_law_1.01,0.5881919860839844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,4,power_law_1.01,0.6027455806732178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,4,power_law_1.2,0.5813439846038818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,4,power_law_1.2,0.5952127933502197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,64,balanced,0.11291733384132385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,64,balanced,0.11705600221951802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,64,power_law_1.01,0.11101440191268921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,64,power_law_1.01,0.1120959997177124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,64,power_law_1.2,0.11431039571762085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,64,power_law_1.2,0.12007679939270019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,8,balanced,0.40037866433461505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,8,balanced,0.4009866714477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,8,power_law_1.01,0.3797951936721802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,8,power_law_1.01,0.40006399154663086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,8,power_law_1.2,0.3343424081802368
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,1,8,power_law_1.2,0.3701888084411621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,16,1,balanced,0.3115680019060771
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,16,1,balanced,0.31856000423431396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,16,1,power_law_1.01,0.20803840160369874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,16,1,power_law_1.01,0.20952320098876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,16,1,power_law_1.2,0.20565121173858641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,16,1,power_law_1.2,0.2070528030395508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,2,1,balanced,1.3987733523050945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,2,1,balanced,1.403018633524577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,2,1,power_law_1.01,0.933619213104248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,2,1,power_law_1.01,0.9541440010070801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,2,1,power_law_1.2,0.9205696105957031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,2,1,power_law_1.2,0.9389823913574219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,4,1,balanced,0.790234645207723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,4,1,balanced,0.7903947035471598
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,4,1,power_law_1.01,0.5435008049011231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,4,1,power_law_1.01,0.5471807956695557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,4,1,power_law_1.2,0.5254208087921143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,4,1,power_law_1.2,0.5366464138031006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,8,1,balanced,0.4505759874979655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,8,1,balanced,0.45099735260009766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,8,1,power_law_1.01,0.31297280788421633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,8,1,power_law_1.01,0.31329920291900637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,8,1,power_law_1.2,0.3063231945037842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,64,7168,2048,8,384,8,1,power_law_1.2,0.30838398933410643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,1,balanced,0.27138666311899823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,1,balanced,0.2714666724205017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,1,power_law_1.01,0.32239999771118166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,1,power_law_1.01,0.3235136032104492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,1,power_law_1.2,0.32536959648132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,1,power_law_1.2,0.32729599475860593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,128,balanced,0.09059199690818787
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,128,balanced,0.09303466478983562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,128,power_law_1.01,0.09370239973068237
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,128,power_law_1.01,0.09496319890022278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,128,power_law_1.2,0.09679359793663025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,128,power_law_1.2,0.09839360117912292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,16,balanced,0.10632000366846721
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,16,balanced,0.1067519982655843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,16,power_law_1.01,0.11250560283660889
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,16,power_law_1.01,0.11578880548477173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,16,power_law_1.2,0.11599999666213989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,16,power_law_1.2,0.11861759424209595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,2,balanced,0.1872533361117045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,2,balanced,0.18790932496388754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,2,power_law_1.01,0.2184448003768921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,2,power_law_1.01,0.23111679553985595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,2,power_law_1.2,0.22753279209136962
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,2,power_law_1.2,0.23404159545898437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,32,balanced,0.09635200103123982
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,32,balanced,0.10103999574979146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,32,power_law_1.01,0.10209280252456665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,32,power_law_1.01,0.1060863971710205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,32,power_law_1.2,0.10742399692535401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,32,power_law_1.2,0.10768640041351318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,4,balanced,0.1439520021279653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,4,balanced,0.1451466679573059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,4,power_law_1.01,0.1666815996170044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,4,power_law_1.01,0.16999679803848267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,4,power_law_1.2,0.16841599941253663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,4,power_law_1.2,0.16936320066452026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,64,balanced,0.09496532877286275
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,64,balanced,0.09548800190289815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,64,power_law_1.01,0.09683840274810791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,64,power_law_1.01,0.09742079973220825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,64,power_law_1.2,0.10037120580673217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,64,power_law_1.2,0.10097279548645019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,8,balanced,0.11707733074824016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,8,balanced,0.11715199549992879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,8,power_law_1.01,0.13639039993286134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,8,power_law_1.01,0.13678079843521118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,8,power_law_1.2,0.1382848024368286
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,1,8,power_law_1.2,0.13843200206756592
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,2,1,balanced,0.17042134205500284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,2,1,balanced,0.17082132895787558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,2,1,power_law_1.01,0.1993600010871887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,2,1,power_law_1.01,0.19944319725036622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,2,1,power_law_1.2,0.20154240131378173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,2048,768,8,128,2,1,power_law_1.2,0.20183680057525635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,1,balanced,1.1250879764556885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,1,balanced,1.1265599727630615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,1,power_law_1.01,1.1529855728149414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,1,power_law_1.01,1.165881633758545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,1,power_law_1.2,1.222879981994629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,1,power_law_1.2,1.235968017578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,128,balanced,0.17712533473968506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,128,balanced,0.17749333381652832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,128,power_law_1.01,0.1826367974281311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,128,power_law_1.01,0.18390400409698487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,128,power_law_1.2,0.18742400407791138
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,128,power_law_1.2,0.1884608030319214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,16,balanced,0.23674132426579794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,16,balanced,0.23736000061035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,16,power_law_1.01,0.2443392038345337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,16,power_law_1.01,0.24855680465698243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,16,power_law_1.2,0.2584127902984619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,16,power_law_1.2,0.2601471900939941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,2,balanced,0.6652746597925822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,2,balanced,0.6668960253397623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,2,power_law_1.01,0.6753024101257324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,2,power_law_1.01,0.689631986618042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,2,power_law_1.2,0.7118783950805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,2,power_law_1.2,0.7130303859710694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,256,balanced,0.17537067333857217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,256,balanced,0.1759200096130371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,256,power_law_1.01,0.17886719703674317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,256,power_law_1.01,0.17889280319213868
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,256,power_law_1.2,0.1823359966278076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,256,power_law_1.2,0.18411519527435302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,32,balanced,0.20148267348607382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,32,balanced,0.2023786703745524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,32,power_law_1.01,0.2163007974624634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,32,power_law_1.01,0.21810560226440429
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,32,power_law_1.2,0.22059519290924073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,32,power_law_1.2,0.22195839881896973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,4,balanced,0.42660800615946454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,4,balanced,0.42689065138498944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,4,power_law_1.01,0.4298367977142334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,4,power_law_1.01,0.43938560485839845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,4,power_law_1.2,0.4593535900115967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,4,power_law_1.2,0.4603775978088379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,64,balanced,0.18358933925628662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,64,balanced,0.18508267402648926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,64,power_law_1.01,0.19077119827270508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,64,power_law_1.01,0.19381760358810424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,64,power_law_1.2,0.195961594581604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,64,power_law_1.2,0.19854079484939574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,8,balanced,0.30157333612442017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,8,balanced,0.30245866378148395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,8,power_law_1.01,0.3144576072692871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,8,power_law_1.01,0.31956479549407957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,8,power_law_1.2,0.3226304054260254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,1,8,power_law_1.2,0.32585599422454836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,2,1,balanced,0.6367520093917847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,2,1,balanced,0.6369973421096802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,2,1,power_law_1.01,0.6558847904205323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,2,1,power_law_1.01,0.6631743907928467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,2,1,power_law_1.2,0.671776008605957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,2,1,power_law_1.2,0.6809023857116699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,4,1,balanced,0.3938239812850952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,4,1,balanced,0.3945173422495524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,4,1,power_law_1.01,0.39331200122833254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,4,1,power_law_1.01,0.39560320377349856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,4,1,power_law_1.2,0.40659198760986326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,3072,1536,8,256,4,1,power_law_1.2,0.42136321067810056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,1,balanced,1.2012053330739338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,1,balanced,1.2015093167622883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,1,power_law_1.01,1.4018943786621094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,1,power_law_1.01,1.4027263641357421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,1,power_law_1.2,1.3708415985107423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,1,power_law_1.2,1.377830410003662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,2,balanced,0.7641279697418213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,2,balanced,0.7669973373413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,2,power_law_1.01,0.8477503776550293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,2,power_law_1.01,1.0209919929504394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,2,power_law_1.2,0.9959744453430176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,2,power_law_1.2,1.0282048225402831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,4,balanced,0.48311467965443927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,4,balanced,0.4835520188013713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,4,power_law_1.01,0.7338624000549316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,4,power_law_1.01,0.7747583866119385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,4,power_law_1.2,0.7850751876831055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,4,power_law_1.2,0.8703743934631347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,8,balanced,0.40070398648579914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,8,balanced,0.40219732125600177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,8,power_law_1.01,0.6238143920898438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,8,power_law_1.01,0.6636288166046143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,8,power_law_1.2,0.7159872055053711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,1,8,power_law_1.2,0.7215871810913086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,16,1,balanced,0.14443733294804892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,16,1,balanced,0.14563733339309692
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,16,1,power_law_1.01,0.15066239833831788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,16,1,power_law_1.01,0.15269119739532472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,16,1,power_law_1.2,0.14974080324172973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,16,1,power_law_1.2,0.15161600112915039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,2,1,balanced,0.6322933435440063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,2,1,balanced,0.6350613435109457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,2,1,power_law_1.01,0.7114048004150391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,2,1,power_law_1.01,0.7163904190063477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,2,1,power_law_1.2,0.7191103935241699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,2,1,power_law_1.2,0.7223360061645507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,4,1,balanced,0.3449386755625407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,4,1,balanced,0.34621866544087726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,4,1,power_law_1.01,0.39444479942321775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,4,1,power_law_1.01,0.39534080028533936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,4,1,power_law_1.2,0.38747520446777345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,4,1,power_law_1.2,0.3899904012680054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,8,1,balanced,0.21099199851353964
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,8,1,balanced,0.2113599975903829
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,8,1,power_law_1.01,0.22337279319763184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,8,1,power_law_1.01,0.22359681129455566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,8,1,power_law_1.2,0.22306559085845948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,14336,2,8,8,1,power_law_1.2,0.22312960624694825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,1,balanced,0.798309326171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,1,balanced,0.8021653493245443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,1,power_law_1.01,1.009171199798584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,1,power_law_1.01,1.0347135543823243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,1,power_law_1.2,1.0515135765075683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,1,power_law_1.2,1.0549823760986328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,128,balanced,0.17114667097727457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,128,balanced,0.17119999726613364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,128,power_law_1.01,0.1761023998260498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,128,power_law_1.01,0.1774783968925476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,128,power_law_1.2,0.18936959505081177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,128,power_law_1.2,0.19298559427261353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,16,balanced,0.19987734158833823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,16,balanced,0.20110932985941568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,16,power_law_1.01,0.24368638992309571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,16,power_law_1.01,0.24744958877563478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,16,power_law_1.2,0.24713599681854248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,16,power_law_1.2,0.25655040740966795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,2,balanced,0.5008053382237753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,2,balanced,0.5018133322397867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,2,power_law_1.01,0.6232384204864502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,2,power_law_1.01,0.6307199954986572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,2,power_law_1.2,0.6361279964447022
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,2,power_law_1.2,0.6606847763061523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,32,balanced,0.17982399463653564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,32,balanced,0.18050666650136313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,32,power_law_1.01,0.20682239532470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,32,power_law_1.01,0.21049599647521972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,32,power_law_1.2,0.21418240070343017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,32,power_law_1.2,0.22042241096496581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,4,balanced,0.3277706702550252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,4,balanced,0.33030933141708374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,4,power_law_1.01,0.405401611328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,4,power_law_1.01,0.4084159851074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,4,power_law_1.2,0.42770562171936033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,4,power_law_1.2,0.44101758003234864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,64,balanced,0.17450666427612305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,64,balanced,0.17454399665196738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,64,power_law_1.01,0.185971200466156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,64,power_law_1.01,0.18762240409851075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,64,power_law_1.2,0.19535360336303711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,64,power_law_1.2,0.2022144079208374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,8,balanced,0.2476960023244222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,8,balanced,0.24820266167322794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,8,power_law_1.01,0.3040895938873291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,8,power_law_1.01,0.3099456071853638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,8,power_law_1.2,0.3097088098526001
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,1,8,power_law_1.2,0.316979193687439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,2,1,balanced,0.47118933995564777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,2,1,balanced,0.47274665037790936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,2,1,power_law_1.01,0.5650559902191162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,2,1,power_law_1.01,0.5673279762268066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,2,1,power_law_1.2,0.5703999996185303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,2,1,power_law_1.2,0.5722367763519287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,4,1,balanced,0.2906986673672994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,4,1,balanced,0.2909066677093506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,4,1,power_law_1.01,0.3468991994857788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,4,1,power_law_1.01,0.34771840572357177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,4,1,power_law_1.2,0.35047039985656736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,1536,8,128,4,1,power_law_1.2,0.35992960929870604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,1,balanced,4.927488009134929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,1,balanced,4.930639902750651
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,1,power_law_1.01,5.547129440307617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,1,power_law_1.01,5.643167877197266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,1,power_law_1.2,5.7648063659667965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,1,power_law_1.2,5.829689788818359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,128,balanced,0.615664005279541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,128,balanced,0.6158773501714071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,128,power_law_1.01,0.6488128185272217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,128,power_law_1.01,0.6536448001861572
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,128,power_law_1.2,0.6731904029846192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,128,power_law_1.2,0.6829887866973877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,16,balanced,0.8644213676452637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,16,balanced,0.8670453230539957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,16,power_law_1.01,0.9468735694885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,16,power_law_1.01,0.9618047714233399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,16,power_law_1.2,0.9884544372558594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,16,power_law_1.2,1.0059776306152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,2,balanced,2.7860692342122397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,2,balanced,2.7898667653401694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,2,power_law_1.01,3.1513088226318358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,2,power_law_1.01,3.1615615844726563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,2,power_law_1.2,3.1732864379882812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,2,power_law_1.2,3.3082176208496095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,256,balanced,0.6012320121129354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,256,balanced,0.6026399930318197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,256,power_law_1.01,0.6322175979614257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,256,power_law_1.01,0.6393343925476074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,256,power_law_1.2,0.6418560028076172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,256,power_law_1.2,0.6546559810638428
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,32,balanced,0.7219999631245931
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,32,balanced,0.7234133084615072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,32,power_law_1.01,0.7809792041778565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,32,power_law_1.01,0.7973440170288086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,32,power_law_1.2,0.8040639877319335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,32,power_law_1.2,0.8216511726379394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,4,balanced,1.6924106280008953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,4,balanced,1.6976693471272786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,4,power_law_1.01,1.9056512832641601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,4,power_law_1.01,1.9080575942993163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,4,power_law_1.2,1.927168083190918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,4,power_law_1.2,2.0076351165771484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,64,balanced,0.6537226835886637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,64,balanced,0.6549866596857706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,64,power_law_1.01,0.69585280418396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,64,power_law_1.01,0.705625581741333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,64,power_law_1.2,0.7225215911865235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,64,power_law_1.2,0.7244480133056641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,8,balanced,1.145301342010498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,8,balanced,1.1486559708913167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,8,power_law_1.01,1.2784000396728517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,8,power_law_1.01,1.3013888359069825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,8,power_law_1.2,1.2902208328247071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,4096,2688,22,512,1,8,power_law_1.2,1.318336009979248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,1,balanced,1.855994701385498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,1,balanced,1.8561654090881348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,1,power_law_1.01,2.1411840438842775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,1,power_law_1.01,2.1728256225585936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,1,power_law_1.2,2.1552000045776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,1,power_law_1.2,2.164998435974121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,2,balanced,1.0652000109354656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,2,balanced,1.065930684407552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,2,power_law_1.01,1.4730751991271973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,2,power_law_1.01,1.555840015411377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,2,power_law_1.2,1.498252773284912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,2,power_law_1.2,1.5713024139404297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,4,balanced,0.6647733449935913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,4,balanced,0.6657013495763143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,4,power_law_1.01,1.1123519897460938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,4,power_law_1.01,1.142521572113037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,4,power_law_1.2,1.0907584190368653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,4,power_law_1.2,1.193734359741211
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,8,balanced,0.5103520154953003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,8,balanced,0.5120640198389689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,8,power_law_1.01,0.9142271995544433
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,8,power_law_1.01,0.9745087623596191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,8,power_law_1.2,0.9660160064697265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,1,8,power_law_1.2,1.0117183685302735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,16,1,balanced,0.2071146567662557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,16,1,balanced,0.20715733369191489
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,16,1,power_law_1.01,0.2130431890487671
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,16,1,power_law_1.01,0.21357440948486328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,16,1,power_law_1.2,0.2118527889251709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,16,1,power_law_1.2,0.21215999126434326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,2,1,balanced,0.9737599690755209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,2,1,balanced,0.975167989730835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,2,1,power_law_1.01,1.1101311683654784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,2,1,power_law_1.01,1.121504020690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,2,1,power_law_1.2,1.1043007850646973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,2,1,power_law_1.2,1.1184191703796387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,32,1,balanced,0.13322133819262186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,32,1,balanced,0.13351999719937643
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,32,1,power_law_1.01,0.13601919412612914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,32,1,power_law_1.01,0.13670400381088257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,32,1,power_law_1.2,0.13628799915313722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,32,1,power_law_1.2,0.1367616057395935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,4,1,balanced,0.5405493179957072
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,4,1,balanced,0.5410293340682983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,4,1,power_law_1.01,0.6068287849426269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,4,1,power_law_1.01,0.6129856109619141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,4,1,power_law_1.2,0.5983424186706543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,4,1,power_law_1.2,0.6071167945861816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,8,1,balanced,0.30081067482630414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,8,1,balanced,0.30265067021052044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,8,1,power_law_1.01,0.35634560585021974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,8,1,power_law_1.01,0.3571775913238525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,8,1,power_law_1.2,0.34637439250946045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,16384,2,8,8,1,power_law_1.2,0.3603584051132202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,1,balanced,2.7253440221150718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,1,balanced,2.7260106404622397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,1,power_law_1.01,2.804435157775879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,1,power_law_1.01,2.824985694885254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,1,power_law_1.2,2.9668352127075197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,1,power_law_1.2,2.982156753540039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,128,balanced,0.28138667345046997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,128,balanced,0.2834666570027669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,128,power_law_1.01,0.2994368076324463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,128,power_law_1.01,0.30309760570526123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,128,power_law_1.2,0.3126976013183594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,128,power_law_1.2,0.3196608066558838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,16,balanced,0.42294931411743164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,16,balanced,0.42396267255147296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,16,power_law_1.01,0.4606207847595215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,16,power_law_1.01,0.4766143798828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,16,power_law_1.2,0.46666879653930665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,16,power_law_1.2,0.4792384147644043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,2,balanced,1.5095680554707844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,2,balanced,1.5121493339538574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,2,power_law_1.01,1.5647744178771972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,2,power_law_1.01,1.573977565765381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,2,power_law_1.2,1.633465576171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,2,power_law_1.2,1.6387008666992187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,256,balanced,0.2739253242810567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,256,balanced,0.27477333943049115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,256,power_law_1.01,0.28549120426177976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,256,power_law_1.01,0.28584320545196534
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,256,power_law_1.2,0.2932735919952393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,256,power_law_1.2,0.2952703952789307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,32,balanced,0.343120018641154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,32,balanced,0.3441386620203654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,32,power_law_1.01,0.36462719440460206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,32,power_law_1.01,0.3748032093048096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,32,power_law_1.2,0.38385279178619386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,32,power_law_1.2,0.38663039207458494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,4,balanced,0.8950453599294027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,4,balanced,0.8967626889546713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,4,power_law_1.01,0.9386624336242676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,4,power_law_1.01,0.9410623550415039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,4,power_law_1.2,0.9753151893615722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,4,power_law_1.2,0.9769791603088379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,64,balanced,0.30170132716496784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,64,balanced,0.30184000730514526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,64,power_law_1.01,0.32644479274749755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,64,power_law_1.01,0.32682878971099855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,64,power_law_1.2,0.33559679985046387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,64,power_law_1.2,0.3427135944366455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,8,balanced,0.5750506718953451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,8,balanced,0.5752426783243815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,8,power_law_1.01,0.6174975872039795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,8,power_law_1.01,0.6328703880310058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,8,power_law_1.2,0.6447103977203369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,1,8,power_law_1.2,0.6575039863586426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,16,1,balanced,0.40248533089955646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,16,1,balanced,0.4041706720987956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,16,1,power_law_1.01,0.4083583831787109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,16,1,power_law_1.01,0.40906238555908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,16,1,power_law_1.2,0.4387519836425781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,16,1,power_law_1.2,0.44118399620056153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,2,1,balanced,1.462458610534668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,2,1,balanced,1.464629332224528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,2,1,power_law_1.01,1.5187135696411134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,2,1,power_law_1.01,1.52674560546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,2,1,power_law_1.2,1.5764991760253906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,2,1,power_law_1.2,1.581984043121338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,4,1,balanced,0.6159733136494955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,4,1,balanced,0.6160800059636434
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,4,1,power_law_1.01,0.771398401260376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,4,1,power_law_1.01,0.7727935791015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,4,1,power_law_1.2,0.806828784942627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,4,1,power_law_1.2,0.8100288391113282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,8,1,balanced,0.444048007329305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,8,1,balanced,0.44787200291951496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,8,1,power_law_1.01,0.4567296028137207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,8,1,power_law_1.01,0.45703678131103515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,8,1,power_law_1.2,0.46448001861572263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2048,8,256,8,1,power_law_1.2,0.46474242210388184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,1,balanced,2.1909759839375815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,1,balanced,2.1918986638387046
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,1,power_law_1.01,2.6359487533569337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,1,power_law_1.01,2.654368019104004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,1,power_law_1.2,2.7190784454345702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,1,power_law_1.2,2.749523162841797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,16,balanced,0.37548800309499103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,16,balanced,0.3755413293838501
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,16,power_law_1.01,0.45452160835266114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,16,power_law_1.01,0.46448640823364257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,16,power_law_1.2,0.4642496109008789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,16,power_law_1.2,0.48085761070251465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,2,balanced,1.2344426314036052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,2,balanced,1.2362133661905925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,2,power_law_1.01,1.4484224319458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,2,power_law_1.01,1.4816448211669921
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,2,power_law_1.2,1.5609727859497071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,2,power_law_1.2,1.5911680221557618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,32,balanced,0.30899200836817425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,32,balanced,0.3107999960581462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,32,power_law_1.01,0.36414079666137694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,32,power_law_1.01,0.3714303970336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,32,power_law_1.2,0.3834496021270752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,32,power_law_1.2,0.38736639022827146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,4,balanced,0.7457919915517172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,4,balanced,0.7460373242696127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,4,power_law_1.01,0.8879679679870606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,4,power_law_1.01,0.9108736038208007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,4,power_law_1.2,0.9447232246398926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,4,power_law_1.2,0.9652031898498535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,8,balanced,0.4995306730270386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,8,balanced,0.4997546672821045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,8,power_law_1.01,0.5819007873535156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,8,power_law_1.01,0.6094592094421387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,8,power_law_1.2,0.6210239887237549
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,1,8,power_law_1.2,0.6257279872894287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,2,1,balanced,1.1778079668680828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,2,1,balanced,1.1783946355183919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,2,1,power_law_1.01,1.4258624076843263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,2,1,power_law_1.01,1.4375807762145996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,2,1,power_law_1.2,1.4606847763061523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,2,1,power_law_1.2,1.4671551704406738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,4,1,balanced,0.8547200361887614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,4,1,balanced,0.856170654296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,4,1,power_law_1.01,0.7927616119384766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,4,1,power_law_1.01,0.8035327911376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,4,1,power_law_1.2,0.8089792251586914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,6144,2560,8,160,4,1,power_law_1.2,0.8126655578613281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,1,balanced,3.1617066065470376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,1,balanced,3.1628106435139975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,1,power_law_1.01,3.2080001831054688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,1,power_law_1.01,3.2538688659667967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,1,power_law_1.2,3.447788619995117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,1,power_law_1.2,3.481363296508789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,128,balanced,0.30821333328882855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,128,balanced,0.308405339717865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,128,power_law_1.01,0.3276160001754761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,128,power_law_1.01,0.33333120346069334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,128,power_law_1.2,0.3417855978012085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,128,power_law_1.2,0.3508863925933838
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,16,balanced,0.4710986614227295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,16,balanced,0.4721226692199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,16,power_law_1.01,0.5073599815368652
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,16,power_law_1.01,0.5088319778442383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,16,power_law_1.2,0.5239871978759766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,16,power_law_1.2,0.5400832176208497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,2,balanced,1.740810712178548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,2,balanced,1.7426133155822754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,2,power_law_1.01,1.801241683959961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,2,power_law_1.01,1.8647872924804687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,2,power_law_1.2,1.8365184783935546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,2,power_law_1.2,1.893600082397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,256,balanced,0.3025173346201579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,256,balanced,0.3025386730829875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,256,power_law_1.01,0.3112512111663818
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,256,power_law_1.01,0.31456000804901124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,256,power_law_1.2,0.3240511894226074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,256,power_law_1.2,0.3278336048126221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,32,balanced,0.3776640097300212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,32,balanced,0.37852267424265545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,32,power_law_1.01,0.40634880065917967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,32,power_law_1.01,0.41471362113952637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,32,power_law_1.2,0.41906561851501467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,32,power_law_1.2,0.4387392044067383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,4,balanced,1.0218666394551594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,4,balanced,1.0240853627522786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,4,power_law_1.01,1.068607997894287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,4,power_law_1.01,1.0871999740600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,4,power_law_1.2,1.1188096046447753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,4,power_law_1.2,1.1445311546325683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,64,balanced,0.3278346657752991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,64,balanced,0.32949866851170856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,64,power_law_1.01,0.3530240058898926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,64,power_law_1.01,0.35528318881988524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,64,power_law_1.2,0.37336320877075196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,64,power_law_1.2,0.38949759006500245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,8,balanced,0.6482986609141032
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,8,balanced,0.6486239830652872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,8,power_law_1.01,0.6925439834594727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,8,power_law_1.01,0.7099199771881104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,8,power_law_1.2,0.7375552177429199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,1,8,power_law_1.2,0.7471231937408447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,16,1,balanced,0.46562135219573975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,16,1,balanced,0.46595199902852374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,16,1,power_law_1.01,0.4720128059387207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,16,1,power_law_1.01,0.47342720031738283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,16,1,power_law_1.2,0.4824063777923584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,16,1,power_law_1.2,0.5050111770629883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,2,1,balanced,1.7015520731608074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,2,1,balanced,1.703173319498698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,2,1,power_law_1.01,1.741542434692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,2,1,power_law_1.01,1.7948991775512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,2,1,power_law_1.2,1.8271743774414062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,2,1,power_law_1.2,1.8497600555419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,4,1,balanced,0.7116693655649821
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,4,1,balanced,0.7118933200836182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,4,1,power_law_1.01,0.8851840019226074
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,4,1,power_law_1.01,0.8896191596984864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,4,1,power_law_1.2,0.9383487701416016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,4,1,power_law_1.2,0.9428159713745117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,8,1,balanced,0.5095093250274658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,8,1,balanced,0.5112586816151937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,8,1,power_law_1.01,0.5290431976318359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,8,1,power_law_1.01,0.5291391849517822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,8,1,power_law_1.2,0.5336192131042481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,256,8,1,power_law_1.2,0.5373375892639161
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,1,balanced,4.6215254465738935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,1,balanced,4.624090512593587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,1,power_law_1.01,4.22355842590332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,1,power_law_1.01,4.23694076538086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,1,power_law_1.2,4.33436164855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,1,power_law_1.2,4.351718521118164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,128,balanced,0.37325334548950195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,128,balanced,0.37351465225219727
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,128,power_law_1.01,0.38292479515075684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,128,power_law_1.01,0.3869055986404419
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,128,power_law_1.2,0.3964416027069092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,128,power_law_1.2,0.39898879528045655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,16,balanced,0.6143840154012045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,16,balanced,0.6153386831283569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,16,power_law_1.01,0.6067840099334717
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,16,power_law_1.01,0.6325632095336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,16,power_law_1.2,0.6375936031341553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,16,power_law_1.2,0.6643904209136963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,2,balanced,2.4943626721700034
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,2,balanced,2.495210647583008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,2,power_law_1.01,2.332863998413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,2,power_law_1.01,2.341721534729004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,2,power_law_1.2,2.3776575088500977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,2,power_law_1.2,2.4422527313232423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,32,balanced,0.48072532812754315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,32,balanced,0.4824426571528117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,32,power_law_1.01,0.48441600799560547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,32,power_law_1.01,0.5007743835449219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,32,power_law_1.2,0.4917247772216797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,32,power_law_1.2,0.5183680057525635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,4,balanced,1.42520538965861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,4,balanced,1.4290879567464192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,4,power_law_1.01,1.3615103721618653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,4,power_law_1.01,1.3719231605529785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,4,power_law_1.2,1.3457728385925294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,4,power_law_1.2,1.364863967895508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,64,balanced,0.4054826498031616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,64,balanced,0.40748266379038495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,64,power_law_1.01,0.4257215976715088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,64,power_law_1.01,0.43111681938171387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,64,power_law_1.2,0.4185215950012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,64,power_law_1.2,0.4234943866729736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,8,balanced,0.8890026410420736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,8,balanced,0.8897066911061605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,8,power_law_1.01,0.8605695724487304
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,8,power_law_1.01,0.8801792144775391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,8,power_law_1.2,0.8822527885437011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,1,8,power_law_1.2,0.9215423583984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,16,1,balanced,0.3511413335800171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,16,1,balanced,0.3522080183029175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,16,1,power_law_1.01,0.48070402145385743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,16,1,power_law_1.01,0.4831999778747559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,16,1,power_law_1.2,0.4843776226043701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,16,1,power_law_1.2,0.48508801460266116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,2,1,balanced,2.469226678212484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,2,1,balanced,2.470794677734375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,2,1,power_law_1.01,2.2642303466796876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,2,1,power_law_1.01,2.299456024169922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,2,1,power_law_1.2,2.3116416931152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,2,1,power_law_1.2,2.331699180603027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,4,1,balanced,1.4220800399780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,4,1,balanced,1.4252692858378093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,4,1,power_law_1.01,1.3033472061157227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,4,1,power_law_1.01,1.313868808746338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,4,1,power_law_1.2,1.35731201171875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,4,1,power_law_1.2,1.3575615882873535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,8,1,balanced,0.5280266602834066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,8,1,balanced,0.5292479991912842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,8,1,power_law_1.01,0.6273215770721435
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,8,1,power_law_1.01,0.6294528007507324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,8,1,power_law_1.2,0.6364672183990479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,768,7168,2048,8,384,8,1,power_law_1.2,0.645958423614502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,1,balanced,0.09129599730173747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,1,balanced,0.09437867005666097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,1,power_law_1.01,0.07137280106544494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,1,power_law_1.01,0.07439360022544861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,1,power_law_1.2,0.06835839748382569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,1,power_law_1.2,0.07097600102424621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,128,balanced,0.037461332976818085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,128,balanced,0.037685332198937736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,128,power_law_1.01,0.03485440015792847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,128,power_law_1.01,0.03594880104064942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,128,power_law_1.2,0.03487359881401062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,128,power_law_1.2,0.03537920117378235
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,16,balanced,0.03737599899371465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,16,balanced,0.03749866783618927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,16,power_law_1.01,0.03617919981479645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,16,power_law_1.01,0.036985599994659425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,16,power_law_1.2,0.036339199542999266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,16,power_law_1.2,0.03671039938926697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,2,balanced,0.06216000020503998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,2,balanced,0.06359466910362244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,2,power_law_1.01,0.05736960172653198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,2,power_law_1.01,0.058841598033905027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,2,power_law_1.2,0.055103999376296994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,2,power_law_1.2,0.056032001972198486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,32,balanced,0.03586133321126302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,32,balanced,0.037018666664759316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,32,power_law_1.01,0.035596799850463864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,32,power_law_1.01,0.03607040047645569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,32,power_law_1.2,0.03607679903507233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,32,power_law_1.2,0.03612799942493439
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,4,balanced,0.04423999786376953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,4,balanced,0.048698668678601585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,4,power_law_1.01,0.047891199588775635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,4,power_law_1.01,0.05011839866638183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,4,power_law_1.2,0.04953599870204926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,4,power_law_1.2,0.051558399200439455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,64,balanced,0.03563733398914337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,64,balanced,0.036415999134381614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,64,power_law_1.01,0.035071998834609985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,64,power_law_1.01,0.03516800105571747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,64,power_law_1.2,0.03560320138931274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,64,power_law_1.2,0.03627519905567169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,8,balanced,0.03770133356253306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,8,balanced,0.039093332986036934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,8,power_law_1.01,0.043219199776649474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,8,power_law_1.01,0.044947201013565065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,8,power_law_1.2,0.043084800243377686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,1,8,power_law_1.2,0.04419200122356415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,2,1,balanced,0.05996266504128774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,2,1,balanced,0.0617439995209376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,2,1,power_law_1.01,0.053273600339889524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,2,1,power_law_1.01,0.055027198791503903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,2,1,power_law_1.2,0.05087360143661499
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,2048,768,8,128,2,1,power_law_1.2,0.05180799961090088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,1,balanced,0.18293333053588867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,1,balanced,0.18353599309921265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,1,power_law_1.01,0.180511999130249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,1,power_law_1.01,0.18152960538864135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,1,power_law_1.2,0.17100160121917723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,1,power_law_1.2,0.17503360509872437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,128,balanced,0.04165333261092504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,128,balanced,0.04387199878692627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,128,power_law_1.01,0.041503998637199405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,128,power_law_1.01,0.043110400438308716
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,128,power_law_1.2,0.04170880019664765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,128,power_law_1.2,0.042444801330566405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,16,balanced,0.0479360024134318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,16,balanced,0.05086933573087057
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,16,power_law_1.01,0.07464960217475891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,16,power_law_1.01,0.07599999904632568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,16,power_law_1.2,0.07323520183563233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,16,power_law_1.2,0.07518720030784606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,2,balanced,0.12485333283742268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,2,balanced,0.12567466497421265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,2,power_law_1.01,0.13108479976654053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,2,power_law_1.01,0.1336192011833191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,2,power_law_1.2,0.1273151993751526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,2,power_law_1.2,0.12778240442276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,256,balanced,0.04228266576925913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,256,balanced,0.043696001172065735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,256,power_law_1.01,0.042208001017570496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,256,power_law_1.01,0.04247680008411407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,256,power_law_1.2,0.042719998955726625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,256,power_law_1.2,0.042771199345588685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,32,balanced,0.04354133208592733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,32,balanced,0.04383466641108195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,32,power_law_1.01,0.05885440111160278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,32,power_law_1.01,0.059673601388931276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,32,power_law_1.2,0.05920640230178833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,32,power_law_1.2,0.060147202014923094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,4,balanced,0.07673599819342296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,4,balanced,0.07973333199818929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,4,power_law_1.01,0.10774400234222412
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,4,power_law_1.01,0.1146239995956421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,4,power_law_1.2,0.10659840106964111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,4,power_law_1.2,0.10938880443572999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,64,balanced,0.041834667325019836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,64,balanced,0.042090664307276406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,64,power_law_1.01,0.04500479996204376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,64,power_law_1.01,0.0458624005317688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,64,power_law_1.2,0.044972801208496095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,64,power_law_1.2,0.045151999592781066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,8,balanced,0.058037335673967995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,8,balanced,0.062218666076660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,8,power_law_1.01,0.08524159789085388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,8,power_law_1.01,0.10209280252456665
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,8,power_law_1.2,0.08104959726333619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,1,8,power_law_1.2,0.08888319730758668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,2,1,balanced,0.11567466457684834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,2,1,balanced,0.12010133266448975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,2,1,power_law_1.01,0.11272959709167481
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,2,1,power_law_1.01,0.11384960412979125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,2,1,power_law_1.2,0.10810240507125854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,2,1,power_law_1.2,0.10983680486679077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,4,1,balanced,0.07250666618347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,4,1,balanced,0.07274666428565979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,4,1,power_law_1.01,0.07002239823341369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,4,1,power_law_1.01,0.07009919881820678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,4,1,power_law_1.2,0.06751999855041504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,3072,1536,8,256,4,1,power_law_1.2,0.06774399876594543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,1,balanced,0.2841973304748535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,1,balanced,0.28813334306081134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,1,power_law_1.01,0.2748863935470581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,1,power_law_1.01,0.27720959186553956
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,1,power_law_1.2,0.26819839477539065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,1,power_law_1.2,0.2781951904296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,2,balanced,0.1969226598739624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,2,balanced,0.20096532503763834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,2,power_law_1.01,0.1882688045501709
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,2,power_law_1.01,0.1899072051048279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,2,power_law_1.2,0.18679039478302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,2,power_law_1.2,0.18992639780044557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,4,balanced,0.1444586714108785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,4,balanced,0.15438933173815408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,4,power_law_1.01,0.1427839994430542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,4,power_law_1.01,0.1434175968170166
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,4,power_law_1.2,0.14897279739379882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,4,power_law_1.2,0.17557120323181152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,8,balanced,0.12601600090662637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,8,balanced,0.12667199969291687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,8,power_law_1.01,0.12755839824676513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,8,power_law_1.01,0.1281599998474121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,8,power_law_1.2,0.127839994430542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,1,8,power_law_1.2,0.127948796749115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,16,1,balanced,0.05106666684150696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,16,1,balanced,0.05179200073083242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,16,1,power_law_1.01,0.04917759895324707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,16,1,power_law_1.01,0.05080320239067078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,16,1,power_law_1.2,0.049209600687026976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,16,1,power_law_1.2,0.04999040067195892
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,2,1,balanced,0.159578671058019
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,2,1,balanced,0.16134400169054666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,2,1,power_law_1.01,0.15571839809417726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,2,1,power_law_1.01,0.1577280044555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,2,1,power_law_1.2,0.1566848039627075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,2,1,power_law_1.2,0.16104960441589355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,4,1,balanced,0.09300800164540608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,4,1,balanced,0.10017066200574239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,4,1,power_law_1.01,0.08700799942016602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,4,1,power_law_1.01,0.08817920088768005
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,4,1,power_law_1.2,0.08870400190353393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,4,1,power_law_1.2,0.0904640018939972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,8,1,balanced,0.06589333216349284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,8,1,balanced,0.06619733572006226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,8,1,power_law_1.01,0.06323840022087097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,8,1,power_law_1.01,0.0644864022731781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,8,1,power_law_1.2,0.0640447974205017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,14336,2,8,8,1,power_law_1.2,0.06424959897994995
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,1,balanced,0.23365867137908936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,1,balanced,0.23546665906906128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,1,power_law_1.01,0.18257280588150024
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,1,power_law_1.01,0.18739839792251586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,1,power_law_1.2,0.16921600103378295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,1,power_law_1.2,0.17056000232696533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,128,balanced,0.04586133360862732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,128,balanced,0.04795200129350027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,128,power_law_1.01,0.04480000138282776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,128,power_law_1.01,0.04514560103416443
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,128,power_law_1.2,0.04488320052623749
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,128,power_law_1.2,0.0463808000087738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,16,balanced,0.05524266759554545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,16,balanced,0.056128000219662987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,16,power_law_1.01,0.06387839913368225
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,16,power_law_1.01,0.06427519917488098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,16,power_law_1.2,0.06250240206718445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,16,power_law_1.2,0.06350719928741455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,2,balanced,0.15156267086664835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,2,balanced,0.15516266226768494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,2,power_law_1.01,0.1373247981071472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,2,power_law_1.01,0.14234880208969117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,2,power_law_1.2,0.12168320417404174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,2,power_law_1.2,0.13207039833068848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,32,balanced,0.04693333307902018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,32,balanced,0.04809066653251648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,32,power_law_1.01,0.051545602083206174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,32,power_law_1.01,0.05367680191993714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,32,power_law_1.2,0.05130879878997803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,32,power_law_1.2,0.05335680246353149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,4,balanced,0.08878399928410848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,4,balanced,0.08959999680519104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,4,power_law_1.01,0.0944320023059845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,4,power_law_1.01,0.10188800096511841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,4,power_law_1.2,0.09278079867362976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,4,power_law_1.2,0.09334400296211243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,64,balanced,0.045791998505592346
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,64,balanced,0.04610133171081543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,64,power_law_1.01,0.045151999592781066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,64,power_law_1.01,0.04590719938278198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,64,power_law_1.2,0.04550400078296661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,64,power_law_1.2,0.045535999536514285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,8,balanced,0.07041066884994507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,8,balanced,0.07046400010585785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,8,power_law_1.01,0.0738431990146637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,8,power_law_1.01,0.08135039806365967
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,8,power_law_1.2,0.07979519963264466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,1,8,power_law_1.2,0.0858560025691986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,2,1,balanced,0.15195199847221375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,2,1,balanced,0.15260799725850424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,2,1,power_law_1.01,0.11342079639434814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,2,1,power_law_1.01,0.11703679561614991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,2,1,power_law_1.2,0.10349440574645996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,2,1,power_law_1.2,0.10371199846267701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,4,1,balanced,0.09197333455085754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,4,1,balanced,0.0922879974047343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,4,1,power_law_1.01,0.07600640058517456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,4,1,power_law_1.01,0.07998719811439514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,4,1,power_law_1.2,0.07464960217475891
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,1536,8,128,4,1,power_law_1.2,0.07486079931259156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,1,balanced,0.9504319826761881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,1,balanced,0.9587146441141764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,1,power_law_1.01,0.8356927871704102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,1,power_law_1.01,0.8717056274414062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,1,power_law_1.2,0.7615424156188965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,1,power_law_1.2,0.7828032016754151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,128,balanced,0.07081066568692525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,128,balanced,0.07211199899514516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,128,power_law_1.01,0.07477759718894958
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,128,power_law_1.01,0.075135999917984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,128,power_law_1.2,0.07217919826507568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,128,power_law_1.2,0.07315199971199035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,16,balanced,0.14131200313568115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,16,balanced,0.1435466706752777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,16,power_law_1.01,0.22501759529113768
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,16,power_law_1.01,0.22560639381408693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,16,power_law_1.2,0.22401280403137208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,16,power_law_1.2,0.22440319061279296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,2,balanced,0.5198666652043661
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,2,balanced,0.5223093430201212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,2,power_law_1.01,0.5167232036590577
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,2,power_law_1.01,0.5309184074401856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,2,power_law_1.2,0.4951807975769043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,2,power_law_1.2,0.5067455768585205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,256,balanced,0.05901333192984263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,256,balanced,0.05991999804973602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,256,power_law_1.01,0.05785599946975708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,256,power_law_1.01,0.06124160289764404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,256,power_law_1.2,0.06188160181045532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,256,power_law_1.2,0.06376960277557372
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,32,balanced,0.1027786632378896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,32,balanced,0.10467200477917989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,32,power_law_1.01,0.14087040424346925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,32,power_law_1.01,0.14118399620056152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,32,power_law_1.2,0.13960319757461548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,32,power_law_1.2,0.14161920547485352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,4,balanced,0.3046879967053731
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,4,balanced,0.30565865834554035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,4,power_law_1.01,0.3752703905105591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,4,power_law_1.01,0.39679999351501466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,4,power_law_1.2,0.3522432088851929
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,4,power_law_1.2,0.3837120056152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,64,balanced,0.08469333251317342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,64,balanced,0.08516266942024231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,64,power_law_1.01,0.08657280206680298
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,64,power_law_1.01,0.09027199745178223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,64,power_law_1.2,0.08917120099067688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,64,power_law_1.2,0.08938239812850952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,8,balanced,0.19040000438690186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,8,balanced,0.1923146645228068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,8,power_law_1.01,0.2891200065612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,8,power_law_1.01,0.30582399368286134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,8,power_law_1.2,0.29171199798583985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,4096,2688,22,512,1,8,power_law_1.2,0.299238395690918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,1,balanced,0.4456373453140259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,1,balanced,0.4472586711247762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,1,power_law_1.01,0.41502718925476073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,1,power_law_1.01,0.4303936004638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,1,power_law_1.2,0.43047680854797366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,1,power_law_1.2,0.43656320571899415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,2,balanced,0.2731786568959554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,2,balanced,0.3002506693204244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,2,power_law_1.01,0.26056320667266847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,2,power_law_1.01,0.2755392074584961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,2,power_law_1.2,0.26626560688018797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,2,power_law_1.2,0.26912000179290774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,4,balanced,0.18714666366577148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,4,balanced,0.18892266352971396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,4,power_law_1.01,0.18585599660873414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,4,power_law_1.01,0.1866752028465271
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,4,power_law_1.2,0.18568320274353028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,4,power_law_1.2,0.1857792019844055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,8,balanced,0.16004799803098044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,8,balanced,0.16051200032234192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,8,power_law_1.01,0.1577407956123352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,8,power_law_1.01,0.15841920375823976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,8,power_law_1.2,0.157151997089386
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,1,8,power_law_1.2,0.17842559814453124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,16,1,balanced,0.06841066479682922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,16,1,balanced,0.06902400155862172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,16,1,power_law_1.01,0.06595839858055115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,16,1,power_law_1.01,0.06662399768829345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,16,1,power_law_1.2,0.06659839749336242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,16,1,power_law_1.2,0.06721280217170715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,2,1,balanced,0.23503466447194418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,2,1,balanced,0.2379093368848165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,2,1,power_law_1.01,0.22755839824676513
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,2,1,power_law_1.01,0.23221120834350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,2,1,power_law_1.2,0.2322943925857544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,2,1,power_law_1.2,0.2339776039123535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,32,1,balanced,0.0547626664241155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,32,1,balanced,0.05817066629727682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,32,1,power_law_1.01,0.054579198360443115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,32,1,power_law_1.01,0.05551360249519348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,32,1,power_law_1.2,0.055276799201965335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,32,1,power_law_1.2,0.05627520084381103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,4,1,balanced,0.1338986655076345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,4,1,balanced,0.16478400429089865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,4,1,power_law_1.01,0.12638720273971557
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,4,1,power_law_1.01,0.12848000526428222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,4,1,power_law_1.2,0.12728960514068605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,4,1,power_law_1.2,0.13156479597091675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,8,1,balanced,0.09066667159398396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,8,1,balanced,0.0953546663125356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,8,1,power_law_1.01,0.08828160166740417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,8,1,power_law_1.01,0.08922880291938781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,8,1,power_law_1.2,0.08515840172767639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,16384,2,8,8,1,power_law_1.2,0.08544639945030212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,1,balanced,0.43560532728830975
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,1,balanced,0.4371573527654012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,1,power_law_1.01,0.43143677711486816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,1,power_law_1.01,0.4340928077697754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,1,power_law_1.2,0.4111040115356445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,1,power_law_1.2,0.4134079933166504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,128,balanced,0.05412800113360087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,128,balanced,0.05609600245952606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,128,power_law_1.01,0.06101120114326477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,128,power_law_1.01,0.06632320284843445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,128,power_law_1.2,0.06095359921455383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,128,power_law_1.2,0.06461439728736877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,16,balanced,0.08125866452852885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,16,balanced,0.0813973347345988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,16,power_law_1.01,0.14088319540023803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,16,power_law_1.01,0.1415743947029114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,16,power_law_1.2,0.14094719886779786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,16,power_law_1.2,0.14158719778060913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,2,balanced,0.2405173381169637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,2,balanced,0.2412266731262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,2,power_law_1.01,0.288921594619751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,2,power_law_1.01,0.291596794128418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,2,power_law_1.2,0.26836481094360354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,2,power_law_1.2,0.27915520668029786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,256,balanced,0.05602133274078369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,256,balanced,0.056128000219662987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,256,power_law_1.01,0.0545087993144989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,256,power_law_1.01,0.054764801263809205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,256,power_law_1.2,0.05430399775505066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,256,power_law_1.2,0.05663999915122986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,32,balanced,0.06003733476003011
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,32,balanced,0.0681279997030894
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,32,power_law_1.01,0.09687680006027222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,32,power_law_1.01,0.0978879988193512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,32,power_law_1.2,0.09618560075759888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,32,power_law_1.2,0.0970304012298584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,4,balanced,0.14468800028165182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,4,balanced,0.14616533120473227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,4,power_law_1.01,0.22524800300598144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,4,power_law_1.01,0.23053441047668458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,4,power_law_1.2,0.2208575963973999
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,4,power_law_1.2,0.22357759475708008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,64,balanced,0.05606399973233541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,64,balanced,0.05611200133959452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,64,power_law_1.01,0.07862399816513062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,64,power_law_1.01,0.07886080145835876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,64,power_law_1.2,0.0766207993030548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,64,power_law_1.2,0.07682560086250305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,8,balanced,0.09310932954152425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,8,balanced,0.09470933675765991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,8,power_law_1.01,0.18198399543762206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,8,power_law_1.01,0.19141759872436523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,8,power_law_1.2,0.1826688051223755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,1,8,power_law_1.2,0.18379520177841185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,16,1,balanced,0.07629333436489105
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,16,1,balanced,0.07720000048478444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,16,1,power_law_1.01,0.07475200295448303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,16,1,power_law_1.01,0.07493119835853576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,16,1,power_law_1.2,0.07418879866600037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,16,1,power_law_1.2,0.07471359968185425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,2,1,balanced,0.2308853268623352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,2,1,balanced,0.23170665899912515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,2,1,power_law_1.01,0.2280832052230835
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,2,1,power_law_1.01,0.22874879837036133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,2,1,power_law_1.2,0.21386239528656006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,2,1,power_law_1.2,0.2165503978729248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,4,1,balanced,0.13652799526850382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,4,1,balanced,0.1378613313039144
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,4,1,power_law_1.01,0.1344831943511963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,4,1,power_law_1.01,0.1360576033592224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,4,1,power_law_1.2,0.1269503951072693
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,4,1,power_law_1.2,0.12736639976501465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,8,1,balanced,0.09874133268992107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,8,1,balanced,0.0995840032895406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,8,1,power_law_1.01,0.09666560292243957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,8,1,power_law_1.01,0.0982912003993988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,8,1,power_law_1.2,0.09381120204925537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2048,8,256,8,1,power_law_1.2,0.09402239918708802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,1,balanced,0.5336480140686035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,1,balanced,0.5356533527374268
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,1,power_law_1.01,0.4432703971862793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,1,power_law_1.01,0.4536640167236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,1,power_law_1.2,0.40694398880004884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,1,power_law_1.2,0.41225600242614746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,16,balanced,0.08621333042780559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,16,balanced,0.08666132887204488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,16,power_law_1.01,0.11674879789352417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,16,power_law_1.01,0.1176192045211792
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,16,power_law_1.2,0.1185920000076294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,16,power_law_1.2,0.1192639946937561
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,2,balanced,0.3021226723988851
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,2,balanced,0.30235199133555096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,2,power_law_1.01,0.2926464080810547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,2,power_law_1.01,0.3150592088699341
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,2,power_law_1.2,0.27022080421447753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,2,power_law_1.2,0.27526400089263914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,32,balanced,0.07242133220036824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,32,balanced,0.07449600100517273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,32,power_law_1.01,0.08794239759445191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,32,power_law_1.01,0.0886080026626587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,32,power_law_1.2,0.08447999954223633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,32,power_law_1.2,0.08471680283546448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,4,balanced,0.17615467309951782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,4,balanced,0.1763413349787394
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,4,power_law_1.01,0.19619840383529663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,4,power_law_1.01,0.20703999996185302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,4,power_law_1.2,0.19319679737091064
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,4,power_law_1.2,0.198361599445343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,8,balanced,0.10410133004188538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,8,balanced,0.10641066233317058
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,8,power_law_1.01,0.16311039924621581
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,8,power_law_1.01,0.17191040515899658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,8,power_law_1.2,0.16275839805603026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,1,8,power_law_1.2,0.17404799461364745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,2,1,balanced,0.30082666873931885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,2,1,balanced,0.3011680046717326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,2,1,power_law_1.01,0.24294400215148926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,2,1,power_law_1.01,0.24327681064605713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,2,1,power_law_1.2,0.224236798286438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,2,1,power_law_1.2,0.22652161121368408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,4,1,balanced,0.18552533785502115
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,4,1,balanced,0.18621333440144858
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,4,1,power_law_1.01,0.13935999870300292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,4,1,power_law_1.01,0.1395967960357666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,4,1,power_law_1.2,0.13052799701690673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,6144,2560,8,160,4,1,power_law_1.2,0.1324671983718872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,1,balanced,0.49882666269938153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,1,balanced,0.5010613203048706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,1,power_law_1.01,0.49918718338012696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,1,power_law_1.01,0.5003456115722656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,1,power_law_1.2,0.4704063892364502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,1,power_law_1.2,0.473203182220459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,128,balanced,0.06005333364009857
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,128,balanced,0.0618453323841095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,128,power_law_1.01,0.07126399874687195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,128,power_law_1.01,0.07215359807014465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,128,power_law_1.2,0.07141759991645813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,128,power_law_1.2,0.07286400198936463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,16,balanced,0.08713066577911377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,16,balanced,0.08740267157554626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,16,power_law_1.01,0.15514880418777466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,16,power_law_1.01,0.15780479907989503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,16,power_law_1.2,0.1506432056427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,16,power_law_1.2,0.1562880039215088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,2,balanced,0.2734453280766805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,2,balanced,0.27345067262649536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,2,power_law_1.01,0.3341248035430908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,2,power_law_1.01,0.3513472080230713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,2,power_law_1.2,0.3012480020523071
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,2,power_law_1.2,0.309497594833374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,256,balanced,0.060191998879114784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,256,balanced,0.06427733103434245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,256,power_law_1.01,0.058220797777175905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,256,power_law_1.01,0.05896959900856018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,256,power_law_1.2,0.05902720093727112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,256,power_law_1.2,0.05912320017814636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,32,balanced,0.07367999851703644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,32,balanced,0.07771733403205872
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,32,power_law_1.01,0.10578559637069702
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,32,power_law_1.01,0.10586880445480347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,32,power_law_1.2,0.10521600246429444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,32,power_law_1.2,0.10540800094604492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,4,balanced,0.16024532914161682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,4,balanced,0.1622880001862844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,4,power_law_1.01,0.25700480937957765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,4,power_law_1.01,0.2643071889877319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,4,power_law_1.2,0.23220479488372803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,4,power_law_1.2,0.23864960670471191
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,64,balanced,0.060005332032839455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,64,balanced,0.06437333424886067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,64,power_law_1.01,0.08515200018882751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,64,power_law_1.01,0.08568320274353028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,64,power_law_1.2,0.08280959725379944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,64,power_law_1.2,0.08655999898910523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,8,balanced,0.11040000120798747
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,8,balanced,0.11079999804496765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,8,power_law_1.01,0.19537919759750366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,8,power_law_1.01,0.21870079040527343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,8,power_law_1.2,0.20367999076843263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,1,8,power_law_1.2,0.2076416015625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,16,1,balanced,0.08469333251317342
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,16,1,balanced,0.08494399984677632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,16,1,power_law_1.01,0.08343679904937744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,16,1,power_law_1.01,0.08394240140914917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,16,1,power_law_1.2,0.08202880024909973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,16,1,power_law_1.2,0.0828607976436615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,2,1,balanced,0.25997867186864215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,2,1,balanced,0.2600586613019307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,2,1,power_law_1.01,0.26114559173583984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,2,1,power_law_1.01,0.26117119789123533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,2,1,power_law_1.2,0.2438271999359131
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,2,1,power_law_1.2,0.2477247953414917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,4,1,balanced,0.15242133537928262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,4,1,balanced,0.15383467078208923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,4,1,power_law_1.01,0.15081599950790406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,4,1,power_law_1.01,0.15162240266799926
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,4,1,power_law_1.2,0.14357759952545165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,4,1,power_law_1.2,0.14380160570144654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,8,1,balanced,0.11025066177050273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,8,1,balanced,0.11100799838701884
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,8,1,power_law_1.01,0.10917119979858399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,8,1,power_law_1.01,0.1093567967414856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,8,1,power_law_1.2,0.10391680002212525
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,256,8,1,power_law_1.2,0.1056447982788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,1,balanced,0.5005813439687093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,1,balanced,0.5038026571273804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,1,power_law_1.01,0.4985663890838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,1,power_law_1.01,0.4999743938446045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,1,power_law_1.2,0.5003392219543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,1,power_law_1.2,0.5017983913421631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,128,balanced,0.06020799775918325
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,128,balanced,0.06197333335876465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,128,power_law_1.01,0.07895680069923401
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,128,power_law_1.01,0.07912319898605347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,128,power_law_1.2,0.07886719703674316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,128,power_law_1.2,0.07984640002250672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,16,balanced,0.08718400200208028
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,16,balanced,0.08846933643023173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,16,power_law_1.01,0.2320512056350708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,16,power_law_1.01,0.23517439365386963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,16,power_law_1.2,0.23440639972686766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,16,power_law_1.2,0.2370368003845215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,2,balanced,0.27425066630045575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,2,balanced,0.27453333139419556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,2,power_law_1.01,0.3608831882476807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,2,power_law_1.01,0.3643712043762207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,2,power_law_1.2,0.34622080326080323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,2,power_law_1.2,0.3549567937850952
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,32,balanced,0.07448533177375793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,32,balanced,0.0766186664501826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,32,power_law_1.01,0.13516160249710082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,32,power_law_1.01,0.13761919736862183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,32,power_law_1.2,0.13575040102005004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,32,power_law_1.2,0.13685120344161988
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,4,balanced,0.15820800264676413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,4,balanced,0.1601599951585134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,4,power_law_1.01,0.2758016109466553
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,4,power_law_1.01,0.2838144063949585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,4,power_law_1.2,0.2691904067993164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,4,power_law_1.2,0.27565441131591795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,64,balanced,0.06181333462397257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,64,balanced,0.06427200138568878
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,64,power_law_1.01,0.0936959981918335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,64,power_law_1.01,0.09413120150566101
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,64,power_law_1.2,0.09292160272598267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,64,power_law_1.2,0.09349120259284974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,8,balanced,0.10713600118954976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,8,balanced,0.10791466633478801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,8,power_law_1.01,0.2622143983840942
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,8,power_law_1.01,0.2705535888671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,8,power_law_1.2,0.2522815942764282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,1,8,power_law_1.2,0.25290238857269287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,16,1,balanced,0.07932800054550171
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,16,1,balanced,0.08052266637484233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,16,1,power_law_1.01,0.07734400033950806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,16,1,power_law_1.01,0.07825919985771179
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,16,1,power_law_1.2,0.07820799946784973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,16,1,power_law_1.2,0.07828480005264282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,2,1,balanced,0.26064532995224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,2,1,balanced,0.26173333326975506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,2,1,power_law_1.01,0.2594239950180054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,2,1,power_law_1.01,0.2602240085601807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,2,1,power_law_1.2,0.2593408107757568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,2,1,power_law_1.2,0.26065280437469485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,4,1,balanced,0.1532586713631948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,4,1,balanced,0.1544426679611206
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,4,1,power_law_1.01,0.1505280017852783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,4,1,power_law_1.01,0.15146880149841307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,4,1,power_law_1.2,0.15185279846191407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,4,1,power_law_1.2,0.15203200578689574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,8,1,balanced,0.10149866342544556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,8,1,balanced,0.10152000188827515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,8,1,power_law_1.01,0.10080000162124633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,8,1,power_law_1.01,0.10096640586853027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,8,1,power_law_1.2,0.10026880502700805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8,7168,2048,8,384,8,1,power_law_1.2,0.10028159618377686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,1,balanced,0.143994669119517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,1,balanced,0.14415466785430908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,1,power_law_1.01,0.1364159941673279
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,1,power_law_1.01,0.1364799976348877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,1,power_law_1.2,0.1359935998916626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,1,power_law_1.2,0.1381183981895447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,128,balanced,0.05157866577307383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,128,balanced,0.052144000927607216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,128,power_law_1.01,0.04922879934310913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,128,power_law_1.01,0.049644801020622256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,128,power_law_1.2,0.04936319887638092
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,128,power_law_1.2,0.04947839975357056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,16,balanced,0.05600533386071523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,16,balanced,0.05765866736570994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,16,power_law_1.01,0.055257600545883176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,16,power_law_1.01,0.0553600013256073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,16,power_law_1.2,0.055257600545883176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,16,power_law_1.2,0.05559679865837097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,2,balanced,0.13700266679128012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,2,balanced,0.13838932911554971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,2,power_law_1.01,0.13306879997253418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,2,power_law_1.01,0.1332352042198181
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,2,power_law_1.2,0.1341055989265442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,2,power_law_1.2,0.13454079627990723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,32,balanced,0.05407999952634176
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,32,balanced,0.05417066812515259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,32,power_law_1.01,0.05316479802131653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,32,power_law_1.01,0.05334399938583374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,32,power_law_1.2,0.051283198595047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,32,power_law_1.2,0.053401601314544675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,4,balanced,0.09754133224487305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,4,balanced,0.09905067086219788
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,4,power_law_1.01,0.09594240188598632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,4,power_law_1.01,0.09607040286064147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,4,power_law_1.2,0.09591680169105529
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,4,power_law_1.2,0.09648640155792236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,64,balanced,0.05073600014050802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,64,balanced,0.05116266508897146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,64,power_law_1.01,0.05008000135421753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,64,power_law_1.01,0.050393599271774295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,64,power_law_1.2,0.05125120282173157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,64,power_law_1.2,0.05129600167274475
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,8,balanced,0.06598400076230367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,8,balanced,0.06665066878000896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,8,power_law_1.01,0.06496000289916992
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,8,power_law_1.01,0.0650111973285675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,8,power_law_1.2,0.06388480067253113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,1,8,power_law_1.2,0.06639360189437866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,2,1,balanced,0.09955199559529622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,2,1,balanced,0.10162132978439331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,2,1,power_law_1.01,0.09509119987487794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,2,1,power_law_1.01,0.09534720182418824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,2,1,power_law_1.2,0.09590399861335755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,2048,768,8,128,2,1,power_law_1.2,0.09645439982414246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,1,balanced,1.0186080137888591
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,1,balanced,1.0195573170979817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,1,power_law_1.01,0.8268863677978515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,1,power_law_1.01,0.8372672080993653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,1,power_law_1.2,0.8134783744812012
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,1,power_law_1.2,0.8158592224121094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,128,balanced,0.094842662413915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,128,balanced,0.09492266178131104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,128,power_law_1.01,0.09437440037727356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,128,power_law_1.01,0.09440640211105347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,128,power_law_1.2,0.09419519901275634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,128,power_law_1.2,0.09437440037727356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,16,balanced,0.15119466185569763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,16,balanced,0.152346670627594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,16,power_law_1.01,0.14727040529251098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,16,power_law_1.01,0.14939520359039307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,16,power_law_1.2,0.13891839981079102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,16,power_law_1.2,0.14765440225601195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,2,balanced,0.5583146810531616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,2,balanced,0.5656853516896566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,2,power_law_1.01,0.4793856143951416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,2,power_law_1.01,0.48000001907348633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,2,power_law_1.2,0.4546495914459229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,2,power_law_1.2,0.47356162071228025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,256,balanced,0.09283199906349182
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,256,balanced,0.09319999814033508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,256,power_law_1.01,0.0917568027973175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,256,power_law_1.01,0.091839998960495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,256,power_law_1.2,0.09215999841690063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,256,power_law_1.2,0.0923520028591156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,32,balanced,0.11948800086975098
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,32,balanced,0.12217600146929423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,32,power_law_1.01,0.11683199405670167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,32,power_law_1.01,0.11695359945297241
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,32,power_law_1.2,0.11162879467010497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,32,power_law_1.2,0.11442559957504272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,4,balanced,0.32839999596277875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,4,balanced,0.3307680090268453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,4,power_law_1.01,0.28744959831237793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,4,power_law_1.01,0.2919872045516968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,4,power_law_1.2,0.28872320652008054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,4,power_law_1.2,0.29719679355621337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,64,balanced,0.10097600022951762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,64,balanced,0.10327999790509541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,64,power_law_1.01,0.09884799718856811
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,64,power_law_1.01,0.10152959823608398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,64,power_law_1.2,0.09773439764976502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,64,power_law_1.2,0.09893760085105896
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,8,balanced,0.20997333526611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,8,balanced,0.21308799584706625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,8,power_law_1.01,0.19279359579086303
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,8,power_law_1.01,0.1955839991569519
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,8,power_law_1.2,0.19326720237731934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,1,8,power_law_1.2,0.1956928014755249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,2,1,balanced,0.5701546669006348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,2,1,balanced,0.571013331413269
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,2,1,power_law_1.01,0.45403518676757815
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,2,1,power_law_1.01,0.4678656101226807
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,2,1,power_law_1.2,0.4475071907043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,2,1,power_law_1.2,0.45996799468994143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,4,1,balanced,0.34426132837931317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,4,1,balanced,0.34625065326690674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,4,1,power_law_1.01,0.2788095951080322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,4,1,power_law_1.01,0.2819008111953735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,4,1,power_law_1.2,0.2784832000732422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,3072,1536,8,256,4,1,power_law_1.2,0.28027520179748533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,1,balanced,0.4484746853510539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,1,balanced,0.4485493501027425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,1,power_law_1.01,0.4492671966552734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,1,power_law_1.01,0.44968318939208984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,1,power_law_1.2,0.44924159049987794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,1,power_law_1.2,0.4517632007598877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,2,balanced,0.3238133390744527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,2,balanced,0.32850666840871173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,2,power_law_1.01,0.3166719913482666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,2,power_law_1.01,0.3240447998046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,2,power_law_1.2,0.3172672033309937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,2,power_law_1.2,0.3285376071929932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,4,balanced,0.25217066208521527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,4,balanced,0.2523413300514221
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,4,power_law_1.01,0.2560960054397583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,4,power_law_1.01,0.26820480823516846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,4,power_law_1.2,0.26301438808441163
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,4,power_law_1.2,0.26537599563598635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,8,balanced,0.21820267041524252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,8,balanced,0.21845867236455283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,8,power_law_1.01,0.2148672103881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,8,power_law_1.01,0.22542080879211426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,8,power_law_1.2,0.21473920345306396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,1,8,power_law_1.2,0.24176640510559083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,16,1,balanced,0.07048533360163371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,16,1,balanced,0.07322666545708974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,16,1,power_law_1.01,0.06776319742202759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,16,1,power_law_1.01,0.06948480010032654
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,16,1,power_law_1.2,0.07062399983406067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,16,1,power_law_1.2,0.07397119998931885
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,2,1,balanced,0.25443732738494873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,2,1,balanced,0.2556533416112264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,2,1,power_law_1.01,0.25292799472808836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,2,1,power_law_1.01,0.2530751943588257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,2,1,power_law_1.2,0.24746880531311036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,2,1,power_law_1.2,0.2551680088043213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,4,1,balanced,0.14453333616256714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,4,1,balanced,0.15069866180419922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,4,1,power_law_1.01,0.14249600172042848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,4,1,power_law_1.01,0.14361599683761597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,4,1,power_law_1.2,0.14303359985351563
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,4,1,power_law_1.2,0.14404480457305907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,8,1,balanced,0.08872532844543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,8,1,balanced,0.08941866954167683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,8,1,power_law_1.01,0.0880128026008606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,8,1,power_law_1.01,0.08812159895896912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,8,1,power_law_1.2,0.08750720024108886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,14336,2,8,8,1,power_law_1.2,0.0877888023853302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,1,balanced,0.6974720160166422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,1,balanced,0.7016692956288656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,1,power_law_1.01,0.6383423805236816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,1,power_law_1.01,0.6465727806091308
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,1,power_law_1.2,0.6487040042877197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,1,power_law_1.2,0.6608640193939209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,128,balanced,0.07484800120194753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,128,balanced,0.07796800136566162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,128,power_law_1.01,0.07414399981498718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,128,power_law_1.01,0.07601280212402343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,128,power_law_1.2,0.07587199807167053
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,128,power_law_1.2,0.07612159848213196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,16,balanced,0.10931733250617981
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,16,balanced,0.11029332876205444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,16,power_law_1.01,0.10595840215682983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,16,power_law_1.01,0.11040639877319336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,16,power_law_1.2,0.10810879468917847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,16,power_law_1.2,0.1099392056465149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,2,balanced,0.39790932337443036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,2,balanced,0.39908798535664874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,2,power_law_1.01,0.35917439460754397
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,2,power_law_1.01,0.3619071960449219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,2,power_law_1.2,0.3747904062271118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,2,power_law_1.2,0.3801919937133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,32,balanced,0.09884267052014668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,32,balanced,0.09891200065612793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,32,power_law_1.01,0.09539200067520141
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,32,power_law_1.01,0.09779840111732482
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,32,power_law_1.2,0.09610880017280579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,32,power_law_1.2,0.09681280255317688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,4,balanced,0.22854934136072794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,4,balanced,0.22959466775258383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,4,power_law_1.01,0.22120959758758546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,4,power_law_1.01,0.22403199672698976
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,4,power_law_1.2,0.2243135929107666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,4,power_law_1.2,0.22545280456542968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,64,balanced,0.08180800080299377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,64,balanced,0.08474666873613994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,64,power_law_1.01,0.08300160169601441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,64,power_law_1.01,0.08609279990196228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,64,power_law_1.2,0.08197759985923767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,64,power_law_1.2,0.08268799781799316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,8,balanced,0.15844266613324484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,8,balanced,0.15902400016784668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,8,power_law_1.01,0.15607680082321168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,8,power_law_1.01,0.156876802444458
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,8,power_law_1.2,0.15529600381851197
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,1,8,power_law_1.2,0.15852799415588378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,2,1,balanced,0.24013332525889078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,2,1,balanced,0.24093866348266602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,2,1,power_law_1.01,0.2256256103515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,2,1,power_law_1.01,0.228057599067688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,2,1,power_law_1.2,0.23066239356994628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,2,1,power_law_1.2,0.23098878860473632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,4,1,balanced,0.16022933522860208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,4,1,balanced,0.160970667997996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,4,1,power_law_1.01,0.15319679975509642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,4,1,power_law_1.01,0.1543552041053772
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,4,1,power_law_1.2,0.1560320019721985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,1536,8,128,4,1,power_law_1.2,0.15612800121307374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,1,balanced,4.402432123819987
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,1,balanced,4.402682622273763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,1,power_law_1.01,3.6954368591308593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,1,power_law_1.01,3.732857513427734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,1,power_law_1.2,3.723603057861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,1,power_law_1.2,3.7441726684570313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,128,balanced,0.27725332975387573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,128,balanced,0.2781920035680135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,128,power_law_1.01,0.27180159091949463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,128,power_law_1.01,0.2769536018371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,128,power_law_1.2,0.2748800039291382
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,128,power_law_1.2,0.27511680126190186
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,16,balanced,0.514352003733317
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,16,balanced,0.5168266693751017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,16,power_law_1.01,0.4916736125946045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,16,power_law_1.01,0.4993408203125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,16,power_law_1.2,0.47944321632385256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,16,power_law_1.2,0.4904895782470703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,2,balanced,2.326378663380941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,2,balanced,2.331077257792155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,2,power_law_1.01,2.0267200469970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,2,power_law_1.01,2.0739839553833006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,2,power_law_1.2,1.9980159759521485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,2,power_law_1.2,2.0372928619384765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,256,balanced,0.25919467210769653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,256,balanced,0.26096532742182416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,256,power_law_1.01,0.25880959033966067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,256,power_law_1.01,0.26010880470275877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,256,power_law_1.2,0.2599744081497192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,256,power_law_1.2,0.260915207862854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,32,balanced,0.3808853228886922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,32,balanced,0.38204801082611084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,32,power_law_1.01,0.3690687894821167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,32,power_law_1.01,0.37939839363098143
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,32,power_law_1.2,0.3695296049118042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,32,power_law_1.2,0.3698944091796875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,4,balanced,1.2951306502024333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,4,balanced,1.29749329884847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,4,power_law_1.01,1.1486720085144042
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,4,power_law_1.01,1.1508352279663085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,4,power_law_1.2,1.121548843383789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,4,power_law_1.2,1.1551808357238769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,64,balanced,0.31625600655873615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,64,balanced,0.3162720004717509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,64,power_law_1.01,0.3104448080062866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,64,power_law_1.01,0.31570560932159425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,64,power_law_1.2,0.3076159954071045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,64,power_law_1.2,0.31087360382080076
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,8,balanced,0.7813386917114258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,8,balanced,0.7818559805552164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,8,power_law_1.01,0.7078271865844726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,8,power_law_1.01,0.7199359893798828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,8,power_law_1.2,0.6946047782897949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,4096,2688,22,512,1,8,power_law_1.2,0.7136127948760986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,1,balanced,0.758570671081543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,1,balanced,0.7592639923095703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,1,power_law_1.01,0.7598847866058349
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,1,power_law_1.01,0.7760704040527344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,1,power_law_1.2,0.7741951942443848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,1,power_law_1.2,0.7846911907196045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,2,balanced,0.4357279936472575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,2,balanced,0.4364159901936849
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,2,power_law_1.01,0.45235838890075686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,2,power_law_1.01,0.4614016056060791
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,2,power_law_1.2,0.4521471977233887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,2,power_law_1.2,0.4522496223449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,4,balanced,0.3176640073458354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,4,balanced,0.32235199213027954
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,4,power_law_1.01,0.3187391996383667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,4,power_law_1.01,0.34476799964904786
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,4,power_law_1.2,0.33749120235443114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,4,power_law_1.2,0.35525760650634763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,8,balanced,0.2678239941596985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,8,balanced,0.26816000541051227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,8,power_law_1.01,0.26397440433502195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,8,power_law_1.01,0.27279999256134035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,8,power_law_1.2,0.28886399269104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,1,8,power_law_1.2,0.28908159732818606
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,16,1,balanced,0.10831999778747559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,16,1,balanced,0.109333336353302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,16,1,power_law_1.01,0.10597120523452759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,16,1,power_law_1.01,0.10689280033111573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,16,1,power_law_1.2,0.10594559907913208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,16,1,power_law_1.2,0.10631040334701539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,2,1,balanced,0.4199093182881673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,2,1,balanced,0.42022931575775146
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,2,1,power_law_1.01,0.41619200706481935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,2,1,power_law_1.01,0.41822080612182616
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,2,1,power_law_1.2,0.4187647819519043
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,2,1,power_law_1.2,0.42344322204589846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,32,1,balanced,0.09166399637858073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,32,1,balanced,0.09184533357620239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,32,1,power_law_1.01,0.08916479945182801
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,32,1,power_law_1.01,0.08950399756431579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,32,1,power_law_1.2,0.0877888023853302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,32,1,power_law_1.2,0.08925439715385437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,4,1,balanced,0.22649067640304565
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,4,1,balanced,0.25463465849558514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,4,1,power_law_1.01,0.22558720111846925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,4,1,power_law_1.01,0.22608640193939208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,4,1,power_law_1.2,0.22529280185699463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,4,1,power_law_1.2,0.22787840366363527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,8,1,balanced,0.13142933448155722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,8,1,balanced,0.13238400220870972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,8,1,power_law_1.01,0.13133440017700196
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,8,1,power_law_1.01,0.131494402885437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,8,1,power_law_1.2,0.12911360263824462
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,16384,2,8,8,1,power_law_1.2,0.12946560382843017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,1,balanced,2.5271147092183432
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,1,balanced,2.5283360481262207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,1,power_law_1.01,2.0137727737426756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,1,power_law_1.01,2.021004867553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,1,power_law_1.2,1.9430976867675782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,1,power_law_1.2,2.011916732788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,128,balanced,0.15763733784357706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,128,balanced,0.1595039963722229
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,128,power_law_1.01,0.15542399883270264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,128,power_law_1.01,0.15679359436035156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,128,power_law_1.2,0.1572864055633545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,128,power_law_1.2,0.15773439407348633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,16,balanced,0.28756799300511676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,16,balanced,0.28757866223653156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,16,power_law_1.01,0.26317439079284666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,16,power_law_1.01,0.26513280868530276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,16,power_law_1.2,0.2611840009689331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,16,power_law_1.2,0.2679935932159424
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,2,balanced,1.324837366739909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,2,balanced,1.3248426914215088
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,2,power_law_1.01,1.0660096168518067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,2,power_law_1.01,1.1271103858947753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,2,power_law_1.2,1.101036834716797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,2,power_law_1.2,1.1218367576599122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,256,balanced,0.14364799857139587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,256,balanced,0.14481600125630698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,256,power_law_1.01,0.14252159595489503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,256,power_law_1.01,0.15111680030822755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,256,power_law_1.2,0.14242559671401978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,256,power_law_1.2,0.1425920009613037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,32,balanced,0.21180800596872965
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,32,balanced,0.2120586633682251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,32,power_law_1.01,0.20217599868774414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,32,power_law_1.01,0.20238080024719238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,32,power_law_1.2,0.18184319734573365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,32,power_law_1.2,0.19803520441055297
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,4,balanced,0.736741304397583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,4,balanced,0.7379786968231201
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,4,power_law_1.01,0.6253503799438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,4,power_law_1.01,0.6442944049835205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,4,power_law_1.2,0.6337664127349854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,4,power_law_1.2,0.6519423961639405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,64,balanced,0.17242133617401123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,64,balanced,0.1727679967880249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,64,power_law_1.01,0.1700096011161804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,64,power_law_1.01,0.17022720575332642
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,64,power_law_1.2,0.16696319580078126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,64,power_law_1.2,0.17036160230636596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,8,balanced,0.250602662563324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,8,balanced,0.2512106696764628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,8,power_law_1.01,0.23024001121520996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,8,power_law_1.01,0.23712639808654784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,8,power_law_1.2,0.2171072006225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,1,8,power_law_1.2,0.23235840797424318
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,16,1,balanced,0.3370506763458252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,16,1,balanced,0.33847999572753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,16,1,power_law_1.01,0.303110408782959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,16,1,power_law_1.01,0.3040640115737915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,16,1,power_law_1.2,0.30207359790802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,16,1,power_law_1.2,0.3028736114501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,2,1,balanced,1.3443093299865723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,2,1,balanced,1.344373385111491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,2,1,power_law_1.01,1.0694080352783204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,2,1,power_law_1.01,1.0729791641235351
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,2,1,power_law_1.2,1.0597951889038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,2,1,power_law_1.2,1.0886783599853516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,4,1,balanced,0.45798933506011963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,4,1,balanced,0.4584159851074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,4,1,power_law_1.01,0.3635135889053345
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,4,1,power_law_1.01,0.3659071922302246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,4,1,power_law_1.2,0.36487040519714353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,4,1,power_law_1.2,0.36497280597686765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,8,1,balanced,0.3083413243293762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,8,1,balanced,0.3151093324025472
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,8,1,power_law_1.01,0.2211456060409546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,8,1,power_law_1.01,0.2271807909011841
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,8,1,power_law_1.2,0.22062079906463622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2048,8,256,8,1,power_law_1.2,0.22490239143371582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,1,balanced,1.993226687113444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,1,balanced,1.9945173263549805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,1,power_law_1.01,1.7337791442871093
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,1,power_law_1.01,1.748307228088379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,1,power_law_1.2,1.7658367156982422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,1,power_law_1.2,1.7893760681152344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,16,balanced,0.23456533749898276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,16,balanced,0.2359573245048523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,16,power_law_1.01,0.2264319896697998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,16,power_law_1.01,0.22851839065551757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,16,power_law_1.2,0.2313983917236328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,16,power_law_1.2,0.23197441101074218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,2,balanced,1.0437013308207195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,2,balanced,1.0454880396525066
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,2,power_law_1.01,0.936070442199707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,2,power_law_1.01,0.9587967872619629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,2,power_law_1.2,0.9300992012023925
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,2,power_law_1.2,0.964352035522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,32,balanced,0.164192001024882
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,32,balanced,0.16497600078582764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,32,power_law_1.01,0.16165119409561157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,32,power_law_1.01,0.16168320178985596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,32,power_law_1.2,0.1596735954284668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,32,power_law_1.2,0.16183040142059327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,4,balanced,0.36692798137664795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,4,balanced,0.36735999584198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,4,power_law_1.01,0.3388159990310669
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,4,power_law_1.01,0.34187519550323486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,4,power_law_1.2,0.3413248062133789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,4,power_law_1.2,0.34240639209747314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,8,balanced,0.24633065859476724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,8,balanced,0.24773865938186646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,8,power_law_1.01,0.22298879623413087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,8,power_law_1.01,0.23350400924682618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,8,power_law_1.2,0.21674880981445313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,1,8,power_law_1.2,0.22663679122924804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,2,1,balanced,1.054517348607381
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,2,1,balanced,1.0571520328521729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,2,1,power_law_1.01,0.9498047828674316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,2,1,power_law_1.01,0.9539392471313477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,2,1,power_law_1.2,0.9437760353088379
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,2,1,power_law_1.2,0.9472640037536622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,4,1,balanced,0.35818668206532794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,4,1,balanced,0.35920000076293945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,4,1,power_law_1.01,0.3275968074798584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,4,1,power_law_1.01,0.3314687967300415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,4,1,power_law_1.2,0.3317823886871338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,6144,2560,8,160,4,1,power_law_1.2,0.33376638889312743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,1,balanced,2.9461278915405273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,1,balanced,2.9462451934814453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,1,power_law_1.01,2.3009408950805663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,1,power_law_1.01,2.349849510192871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,1,power_law_1.2,2.2860671997070314
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,1,power_law_1.2,2.315475273132324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,128,balanced,0.18062400817871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,128,balanced,0.1827413241068522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,128,power_law_1.01,0.17882239818572998
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,128,power_law_1.01,0.17989120483398438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,128,power_law_1.2,0.18005119562149047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,128,power_law_1.2,0.18012160062789917
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,16,balanced,0.3235519925753276
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,16,balanced,0.32425065835316974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,16,power_law_1.01,0.3069119930267334
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,16,power_law_1.01,0.30792319774627686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,16,power_law_1.2,0.30286080837249757
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,16,power_law_1.2,0.30687999725341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,2,balanced,1.5379145940144856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,2,balanced,1.5392212867736816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,2,power_law_1.01,1.2630784034729003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,2,power_law_1.01,1.2976767539978027
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,2,power_law_1.2,1.21331844329834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,2,power_law_1.2,1.2389632225036622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,256,balanced,0.161381334066391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,256,balanced,0.17284266153971353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,256,power_law_1.01,0.16083840131759644
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,256,power_law_1.01,0.1696768045425415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,256,power_law_1.2,0.16267520189285278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,256,power_law_1.2,0.163264000415802
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,32,balanced,0.23591466744740805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,32,balanced,0.2360373338063558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,32,power_law_1.01,0.22329599857330323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,32,power_law_1.01,0.23116800785064698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,32,power_law_1.2,0.21444480419158934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,32,power_law_1.2,0.22697598934173585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,4,balanced,0.8497973283131918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,4,balanced,0.8504693508148193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,4,power_law_1.01,0.7473919868469239
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,4,power_law_1.01,0.7641664028167725
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,4,power_law_1.2,0.7084928035736084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,4,power_law_1.2,0.7424704074859619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,64,balanced,0.19271467129389444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,64,balanced,0.19508800903956094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,64,power_law_1.01,0.19011839628219604
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,64,power_law_1.01,0.19148800373077393
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,64,power_law_1.2,0.19104000329971313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,64,power_law_1.2,0.19278719425201415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,8,balanced,0.2906186580657959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,8,balanced,0.2910719911257426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,8,power_law_1.01,0.25560319423675537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,8,power_law_1.01,0.26545279026031493
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,8,power_law_1.2,0.27146239280700685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,1,8,power_law_1.2,0.2773184061050415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,16,1,balanced,0.3885546525319417
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,16,1,balanced,0.38860801855723065
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,16,1,power_law_1.01,0.34904959201812746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,16,1,power_law_1.01,0.3503040075302124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,16,1,power_law_1.2,0.3465280055999756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,16,1,power_law_1.2,0.3486783981323242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,2,1,balanced,1.5636000633239746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,2,1,balanced,1.5636372566223145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,2,1,power_law_1.01,1.2442432403564454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,2,1,power_law_1.01,1.2499839782714843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,2,1,power_law_1.2,1.219711971282959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,2,1,power_law_1.2,1.2270079612731934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,4,1,balanced,0.5316160122553507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,4,1,balanced,0.5346133311589559
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,4,1,power_law_1.01,0.42200322151184083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,4,1,power_law_1.01,0.42421760559082033
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,4,1,power_law_1.2,0.41502718925476073
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,4,1,power_law_1.2,0.41685757637023924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,8,1,balanced,0.34218132495880127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,8,1,balanced,0.347327987353007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,8,1,power_law_1.01,0.25248639583587645
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,8,1,power_law_1.01,0.25562880039215086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,8,1,power_law_1.2,0.2504703998565674
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,256,8,1,power_law_1.2,0.25384318828582764
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,1,balanced,4.369450569152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,1,balanced,4.372058550516765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,1,power_law_1.01,3.0957632064819336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,1,power_law_1.01,3.141804885864258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,1,power_law_1.2,2.981452751159668
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,1,power_law_1.2,3.043692779541016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,128,balanced,0.23224000136057535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,128,balanced,0.23227733373641968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,128,power_law_1.01,0.23079679012298585
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,128,power_law_1.01,0.23220479488372803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,128,power_law_1.2,0.23009281158447265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,128,power_law_1.2,0.23013761043548583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,16,balanced,0.46376001834869385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,16,balanced,0.4650239944458008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,16,power_law_1.01,0.430463981628418
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,16,power_law_1.01,0.4385983943939209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,16,power_law_1.2,0.4236735820770264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,16,power_law_1.2,0.4290112018585205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,2,balanced,2.277525266011556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,2,balanced,2.327573299407959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,2,power_law_1.01,1.6461376190185546
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,2,power_law_1.01,1.664543914794922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,2,power_law_1.2,1.7268863677978517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,2,power_law_1.2,1.733907127380371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,32,balanced,0.3347146511077881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,32,balanced,0.33534399668375653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,32,power_law_1.01,0.31000959873199463
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,32,power_law_1.01,0.3116352081298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,32,power_law_1.2,0.30910720825195315
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,32,power_law_1.2,0.31086719036102295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,4,balanced,1.2444693247477214
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,4,balanced,1.2479146321614583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,4,power_law_1.01,1.054310417175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,4,power_law_1.01,1.0845376014709474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,4,power_law_1.2,1.0078911781311035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,4,power_law_1.2,1.03755521774292
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,64,balanced,0.26501333713531494
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,64,balanced,0.26637866099675495
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,64,power_law_1.01,0.2565056085586548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,64,power_law_1.01,0.2567487955093384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,64,power_law_1.2,0.2506432056427002
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,64,power_law_1.2,0.2596415996551514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,8,balanced,0.72980268796285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,8,balanced,0.7299253145853678
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,8,power_law_1.01,0.6322112083435059
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,8,power_law_1.01,0.6761792182922364
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,8,power_law_1.2,0.6264639854431152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,1,8,power_law_1.2,0.6506688117980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,16,1,balanced,0.3122719923655192
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,16,1,balanced,0.32051199674606323
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,16,1,power_law_1.01,0.21624319553375243
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,16,1,power_law_1.01,0.21709439754486085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,16,1,power_law_1.2,0.20937600135803222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,16,1,power_law_1.2,0.21663360595703124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,2,1,balanced,2.3551252683003745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,2,1,balanced,2.3699466387430825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,2,1,power_law_1.01,1.6375616073608399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,2,1,power_law_1.01,1.6786239624023438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,2,1,power_law_1.2,1.595961570739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,2,1,power_law_1.2,1.6447296142578125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,4,1,balanced,1.3093866507212322
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,4,1,balanced,1.3102453549702961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,4,1,power_law_1.01,0.9754624366760254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,4,1,power_law_1.01,0.9765312194824218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,4,1,power_law_1.2,0.9290495872497558
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,4,1,power_law_1.2,0.9513792037963867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,8,1,balanced,0.4530826807022095
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,8,1,balanced,0.453109343846639
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,8,1,power_law_1.01,0.3223743915557861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,8,1,power_law_1.01,0.3224319934844971
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,8,1,power_law_1.2,0.3173376083374023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,80,7168,2048,8,384,8,1,power_law_1.2,0.3185728073120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,1,balanced,1.6977386474609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,1,balanced,1.6977492968241374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,1,power_law_1.01,1.6816255569458007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,1,power_law_1.01,1.6856447219848634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,1,power_law_1.2,1.6853439331054687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,1,power_law_1.2,1.6860671997070313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,128,balanced,0.6254453261693319
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,128,balanced,0.6255573431650797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,128,power_law_1.01,0.6922880172729492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,128,power_law_1.01,0.7001471996307373
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,128,power_law_1.2,0.7409535884857178
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,128,power_law_1.2,0.7449471950531006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,16,balanced,0.6908906300862631
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,16,balanced,0.6920533180236816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,16,power_law_1.01,0.7905151844024658
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,16,power_law_1.01,0.7912767887115478
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,16,power_law_1.2,0.8335743904113769
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,16,power_law_1.2,0.8502079963684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,2,balanced,1.2177973588307698
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,2,balanced,1.2181599934895833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,2,power_law_1.01,1.261567974090576
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,2,power_law_1.01,1.284921646118164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,2,power_law_1.2,1.2740544319152831
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,2,power_law_1.2,1.282419204711914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,32,balanced,0.6552426815032959
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,32,balanced,0.6555786530176798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,32,power_law_1.01,0.7488383769989013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,32,power_law_1.01,0.7530496120452881
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,32,power_law_1.2,0.7834688186645508
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,32,power_law_1.2,0.7889088153839111
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,4,balanced,0.9176906744639078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,4,balanced,0.9189759890238444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,4,power_law_1.01,1.0171392440795899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,4,power_law_1.01,1.017471981048584
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,4,power_law_1.2,1.0493696212768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,4,power_law_1.2,1.0539456367492677
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,64,balanced,0.6354879935582479
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,64,balanced,0.6368319988250732
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,64,power_law_1.01,0.7049407958984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,64,power_law_1.01,0.7068992137908936
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,64,power_law_1.2,0.7449215888977051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,64,power_law_1.2,0.7620160102844238
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,8,balanced,0.7682240009307861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,8,balanced,0.7690719763437907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,8,power_law_1.01,0.8659711837768554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,8,power_law_1.01,0.893984031677246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,8,power_law_1.2,0.9028863906860352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,1,8,power_law_1.2,0.9118847846984863
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,2,1,balanced,1.0308960278828938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,2,1,balanced,1.033141295115153
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,2,1,power_law_1.01,1.0477696418762208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,2,1,power_law_1.01,1.0494144439697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,2,1,power_law_1.2,1.0439295768737793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,2048,768,8,128,2,1,power_law_1.2,1.0496576309204102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,1,balanced,4.302186648050944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,1,balanced,4.303152084350586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,1,power_law_1.01,4.645926284790039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,1,power_law_1.01,4.664780807495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,1,power_law_1.2,4.622387313842774
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,1,power_law_1.2,4.642086410522461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,128,balanced,1.0444213549296062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,128,balanced,1.0446666876475017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,128,power_law_1.01,1.149068832397461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,128,power_law_1.01,1.165503978729248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,128,power_law_1.2,1.2166208267211913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,128,power_law_1.2,1.2863231658935548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,16,balanced,1.233850638071696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,16,balanced,1.2366453011830647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,16,power_law_1.01,1.4260543823242187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,16,power_law_1.01,1.442131233215332
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,16,power_law_1.2,1.4425151824951172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,16,power_law_1.2,1.5063488006591796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,2,balanced,2.7229652404785156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,2,balanced,2.725189208984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,2,power_law_1.01,3.0224000930786135
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,2,power_law_1.01,3.0752895355224608
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,2,power_law_1.2,3.0623231887817384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,2,power_law_1.2,3.1182464599609374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,256,balanced,1.028714656829834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,256,balanced,1.030197302500407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,256,power_law_1.01,1.1310144424438477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,256,power_law_1.01,1.1326592445373536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,256,power_law_1.2,1.2087679862976075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,256,power_law_1.2,1.2162816047668457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,32,balanced,1.1243840058644612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,32,balanced,1.124714692433675
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,32,power_law_1.01,1.2875840187072753
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,32,power_law_1.01,1.3014592170715331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,32,power_law_1.2,1.3987199783325195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,32,power_law_1.2,1.4287936210632324
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,4,balanced,1.874608039855957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,4,balanced,1.8771519660949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,4,power_law_1.01,2.093337631225586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,4,power_law_1.01,2.127801513671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,4,power_law_1.2,2.309548759460449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,4,power_law_1.2,2.3477439880371094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,64,balanced,1.0712160269419353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,64,balanced,1.0728800296783447
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,64,power_law_1.01,1.2125311851501466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,64,power_law_1.01,1.217363166809082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,64,power_law_1.2,1.322003173828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,64,power_law_1.2,1.3417216300964356
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,8,balanced,1.4468107223510742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,8,balanced,1.447146733601888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,8,power_law_1.01,1.6351423263549805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,8,power_law_1.01,1.6860927581787108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,8,power_law_1.2,1.809939193725586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,1,8,power_law_1.2,1.8498367309570312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,2,1,balanced,2.464730739593506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,2,1,balanced,2.4670507113138833
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,2,1,power_law_1.01,2.6107200622558593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,2,1,power_law_1.01,2.6215744018554688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,2,1,power_law_1.2,2.6199487686157226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,2,1,power_law_1.2,2.620966339111328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,4,1,balanced,1.5185866355895996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,4,1,balanced,1.5194932619730632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,4,1,power_law_1.01,1.6125312805175782
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,4,1,power_law_1.01,1.614521598815918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,4,1,power_law_1.2,1.6104127883911132
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,3072,1536,8,256,4,1,power_law_1.2,1.613382339477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,1,balanced,10.562143961588541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,1,balanced,10.580133438110352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,1,power_law_1.01,10.974809265136718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,1,power_law_1.01,11.01317138671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,1,power_law_1.2,10.963314819335938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,1,power_law_1.2,10.998445129394531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,2,balanced,6.155514399210612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,2,balanced,6.15667724609375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,2,power_law_1.01,8.149337768554688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,2,power_law_1.01,8.210739135742188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,2,power_law_1.2,7.784780883789063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,2,power_law_1.2,8.832595062255859
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,4,balanced,3.9041547775268555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,4,balanced,3.905344009399414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,4,power_law_1.01,6.220678329467773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,4,power_law_1.01,6.561504364013672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,4,power_law_1.2,6.031481552124023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,4,power_law_1.2,6.332332611083984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,8,balanced,2.7965332667032876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,8,balanced,2.799663861592611
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,8,power_law_1.01,5.844921493530274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,8,power_law_1.01,5.874265670776367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,8,power_law_1.2,5.644607925415039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,1,8,power_law_1.2,6.155551910400391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,16,1,balanced,0.9004480044047037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,16,1,balanced,0.9027199745178223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,16,1,power_law_1.01,0.8740287780761719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,16,1,power_law_1.01,0.8818943977355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,16,1,power_law_1.2,0.8769087791442871
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,16,1,power_law_1.2,0.8794816017150879
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,2,1,balanced,5.321845372517903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,2,1,balanced,5.324874560038249
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,2,1,power_law_1.01,5.441247940063477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,2,1,power_law_1.01,5.461331176757812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,2,1,power_law_1.2,5.457830429077148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,2,1,power_law_1.2,5.47125129699707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,4,1,balanced,2.789408047993978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,4,1,balanced,2.7908480962117515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,4,1,power_law_1.01,2.8056512832641602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,4,1,power_law_1.01,2.805824089050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,4,1,power_law_1.2,2.806438446044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,4,1,power_law_1.2,2.8095935821533202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,8,1,balanced,1.5340159734090169
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,8,1,balanced,1.5347199440002441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,8,1,power_law_1.01,1.4872320175170899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,8,1,power_law_1.01,1.5025792121887207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,8,1,power_law_1.2,1.4883904457092285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,14336,2,8,8,1,power_law_1.2,1.4932928085327148
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,1,balanced,5.3035093943278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,1,balanced,5.307392120361328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,1,power_law_1.01,5.3767742156982425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,1,power_law_1.01,5.391033554077149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,1,power_law_1.2,5.315948867797852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,1,power_law_1.2,5.324665451049805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,128,balanced,1.1495733261108398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,128,balanced,1.1522826353708904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,128,power_law_1.01,1.3894975662231446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,128,power_law_1.01,1.4240703582763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,128,power_law_1.2,1.5133824348449707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,128,power_law_1.2,1.5947327613830566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,16,balanced,1.3916160265604656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,16,balanced,1.3929492632548015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,16,power_law_1.01,1.6867904663085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,16,power_law_1.01,1.6932992935180664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,16,power_law_1.2,1.8722047805786133
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,16,power_law_1.2,1.9198911666870118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,2,balanced,3.29478391011556
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,2,balanced,3.2956212361653647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,2,power_law_1.01,3.5975296020507814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,2,power_law_1.01,3.6347007751464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,2,power_law_1.2,3.591059112548828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,2,power_law_1.2,3.708607864379883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,32,balanced,1.2521493434906006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,32,balanced,1.2557120323181152
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,32,power_law_1.01,1.546233558654785
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,32,power_law_1.01,1.5767807960510254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,32,power_law_1.2,1.7426944732666017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,32,power_law_1.2,1.818943977355957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,4,balanced,2.211322625478109
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,4,balanced,2.212735970815023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,4,power_law_1.01,2.631679916381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,4,power_law_1.01,2.6357887268066404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,4,power_law_1.2,2.6833984375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,4,power_law_1.2,2.685152053833008
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,64,balanced,1.1830399831136067
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,64,balanced,1.1874453226725261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,64,power_law_1.01,1.432863998413086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,64,power_law_1.01,1.5168000221252442
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,64,power_law_1.2,1.569215965270996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,64,power_law_1.2,1.6361919403076173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,8,balanced,1.6670400301615398
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,8,balanced,1.667199929555257
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,8,power_law_1.01,2.0436351776123045
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,8,power_law_1.01,2.15338249206543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,8,power_law_1.2,2.104787254333496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,1,8,power_law_1.2,2.1645952224731446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,2,1,balanced,3.0157972971598306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,2,1,balanced,3.0220371882120767
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,2,1,power_law_1.01,2.9587263107299804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,2,1,power_law_1.01,2.9691776275634765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,2,1,power_law_1.2,2.965004730224609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,2,1,power_law_1.2,2.9726335525512697
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,4,1,balanced,1.8448106447855632
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,4,1,balanced,1.8463999430338542
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,4,1,power_law_1.01,1.8723199844360352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,4,1,power_law_1.01,1.8757375717163085
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,4,1,power_law_1.2,1.8687488555908203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,1536,8,128,4,1,power_law_1.2,1.8689855575561523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,1,balanced,26.04145050048828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,1,balanced,26.052401224772137
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,1,power_law_1.01,26.008428955078124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,1,power_law_1.01,26.022610473632813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,1,power_law_1.2,25.830111694335937
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,1,power_law_1.2,25.868743896484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,128,balanced,4.301098823547363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,128,balanced,4.3075253168741865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,128,power_law_1.01,4.763654327392578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,128,power_law_1.01,4.796870422363281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,128,power_law_1.2,5.029324722290039
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,128,power_law_1.2,5.151411056518555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,16,balanced,5.53769048055013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,16,balanced,5.547701517740886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,16,power_law_1.01,6.247507095336914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,16,power_law_1.01,6.283327865600586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,16,power_law_1.2,6.6659393310546875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,16,power_law_1.2,6.712268829345703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,2,balanced,15.298751831054688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,2,balanced,15.302735646565756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,2,power_law_1.01,15.860890197753907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,2,power_law_1.01,16.54131164550781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,2,power_law_1.2,15.560954284667968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,2,power_law_1.2,16.561056518554686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,256,balanced,4.214607874552409
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,256,balanced,4.2276105880737305
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,256,power_law_1.01,4.603590393066407
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,256,power_law_1.01,4.621676635742188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,256,power_law_1.2,4.907020950317383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,256,power_law_1.2,4.951039886474609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,32,balanced,4.834277470906575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,32,balanced,4.834949175516765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,32,power_law_1.01,5.477107238769531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,32,power_law_1.01,5.56360969543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,32,power_law_1.2,5.876595306396484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,32,power_law_1.2,5.878822326660156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,4,balanced,9.734965642293295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,4,balanced,9.738794962565104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,4,power_law_1.01,10.39838104248047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,4,power_law_1.01,10.642259216308593
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,4,power_law_1.2,10.455980682373047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,4,power_law_1.2,10.917056274414062
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,64,balanced,4.479669253031413
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,64,balanced,4.500010808308919
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,64,power_law_1.01,5.065644836425781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,64,power_law_1.01,5.142758560180664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,64,power_law_1.2,5.342854309082031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,64,power_law_1.2,5.661433410644531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,8,balanced,6.9462025960286455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,8,balanced,6.9642079671223955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,8,power_law_1.01,7.687852478027343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,8,power_law_1.01,7.795891571044922
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,8,power_law_1.2,8.216352081298828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,4096,2688,22,512,1,8,power_law_1.2,8.315328216552734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,1,balanced,17.24305597941081
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,1,balanced,17.247365315755207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,1,power_law_1.01,17.72662353515625
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,1,power_law_1.01,17.738694763183595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,1,power_law_1.2,17.630534362792968
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,1,power_law_1.2,17.784275817871094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,2,balanced,9.588213602701822
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,2,balanced,9.589594523111979
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,2,power_law_1.01,12.385420989990234
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,2,power_law_1.01,14.511564636230469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,2,power_law_1.2,12.372019195556641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,2,power_law_1.2,13.323898315429688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,4,balanced,5.786474863688151
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,4,balanced,5.788592020670573
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,4,power_law_1.01,11.676249694824218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,4,power_law_1.01,9.262406158447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,4,power_law_1.2,10.130105590820312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,4,power_law_1.2,11.354688262939453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,8,balanced,3.8809601465861
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,8,balanced,3.884474754333496
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,8,power_law_1.01,8.035456085205078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,8,power_law_1.01,9.225753784179688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,8,power_law_1.2,9.086752319335938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,1,8,power_law_1.2,9.403014373779296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,16,1,balanced,1.4221067428588867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,16,1,balanced,1.4248372713724773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,16,1,power_law_1.01,1.368876838684082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,16,1,power_law_1.01,1.371020793914795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,16,1,power_law_1.2,1.3601152420043945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,16,1,power_law_1.2,1.3652416229248048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,2,1,balanced,8.59504508972168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,2,1,balanced,8.611189524332682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,2,1,power_law_1.01,8.807552337646484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,2,1,power_law_1.01,8.866809844970703
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,2,1,power_law_1.2,8.81775360107422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,2,1,power_law_1.2,8.840211486816406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,32,1,balanced,0.9031999905904134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,32,1,balanced,0.9036426544189453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,32,1,power_law_1.01,0.8777728080749512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,32,1,power_law_1.01,0.8790399551391601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,32,1,power_law_1.2,0.877177619934082
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,32,1,power_law_1.2,0.8852160453796387
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,4,1,balanced,4.482416152954102
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,4,1,balanced,4.4833065668741865
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,4,1,power_law_1.01,4.572415924072265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,4,1,power_law_1.01,4.591398239135742
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,4,1,power_law_1.2,4.580928039550781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,4,1,power_law_1.2,4.59051513671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,8,1,balanced,2.4400854110717773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,8,1,balanced,2.443391958872477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,8,1,power_law_1.01,2.4402944564819338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,8,1,power_law_1.01,2.4436479568481446
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,8,1,power_law_1.2,2.4255615234375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,16384,2,8,8,1,power_law_1.2,2.4368576049804687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,1,balanced,10.088293075561523
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,1,balanced,10.089103698730469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,1,power_law_1.01,11.176870727539063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,1,power_law_1.01,11.203846740722657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,1,power_law_1.2,11.224979400634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,1,power_law_1.2,11.227008056640624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,128,balanced,1.663599967956543
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,128,balanced,1.668085257212321
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,128,power_law_1.01,1.9634111404418946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,128,power_law_1.01,2.0163135528564453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,128,power_law_1.2,2.135116767883301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,128,power_law_1.2,2.208665657043457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,16,balanced,2.1483519872029624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,16,balanced,2.1558240254720054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,16,power_law_1.01,2.6656000137329103
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,16,power_law_1.01,2.743827247619629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,16,power_law_1.2,2.9396352767944336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,16,power_law_1.2,2.9830463409423826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,2,balanced,5.9627736409505205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,2,balanced,5.967957178751628
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,2,power_law_1.01,6.860147094726562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,2,power_law_1.01,7.036851501464843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,2,power_law_1.2,7.047398376464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,2,power_law_1.2,7.177702331542969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,256,balanced,1.629317283630371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,256,balanced,1.6308693885803223
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,256,power_law_1.01,1.853977584838867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,256,power_law_1.01,1.9014400482177733
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,256,power_law_1.2,2.158380889892578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,256,power_law_1.2,2.1994112014770506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,32,balanced,1.871338685353597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,32,balanced,1.8733545939127605
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,32,power_law_1.01,2.2925567626953125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,32,power_law_1.01,2.309574317932129
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,32,power_law_1.2,2.4407167434692383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,32,power_law_1.2,2.6277952194213867
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,4,balanced,3.7932052612304688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,4,balanced,3.798842748006185
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,4,power_law_1.01,4.497427368164063
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,4,power_law_1.01,4.645708847045898
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,4,power_law_1.2,4.532633590698242
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,4,power_law_1.2,4.8130943298339846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,64,balanced,1.733583927154541
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,64,balanced,1.7371519406636555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,64,power_law_1.01,2.086649513244629
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,64,power_law_1.01,2.1330175399780273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,64,power_law_1.2,2.2920576095581056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,64,power_law_1.2,2.3129344940185548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,8,balanced,2.600213368733724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,8,balanced,2.6047840118408203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,8,power_law_1.01,3.1627775192260743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,8,power_law_1.01,3.210291290283203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,8,power_law_1.2,3.406079864501953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,1,8,power_law_1.2,3.499692916870117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,16,1,balanced,1.6992479960123699
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,16,1,balanced,1.6993120511372883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,16,1,power_law_1.01,1.8228288650512696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,16,1,power_law_1.01,1.830771255493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,16,1,power_law_1.2,1.8300863265991212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,16,1,power_law_1.2,1.8387712478637694
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,2,1,balanced,5.5658721923828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,2,1,balanced,5.566165288289388
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,2,1,power_law_1.01,6.095571136474609
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,2,1,power_law_1.01,6.1021888732910154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,2,1,power_law_1.2,6.087321472167969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,2,1,power_law_1.2,6.108415985107422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,4,1,balanced,3.2209599812825522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,4,1,balanced,3.2211573918660483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,4,1,power_law_1.01,3.508006286621094
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,4,1,power_law_1.01,3.5159488677978517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,4,1,power_law_1.2,3.540083312988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,4,1,power_law_1.2,3.5468414306640623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,8,1,balanced,4.401583989461263
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,8,1,balanced,4.408378601074219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,8,1,power_law_1.01,4.5517120361328125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,8,1,power_law_1.01,4.557056045532226
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,8,1,power_law_1.2,4.585868835449219
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2048,8,256,8,1,power_law_1.2,4.588921737670899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,1,balanced,13.025029500325521
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,1,balanced,13.042592366536459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,1,power_law_1.01,12.804722595214844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,1,power_law_1.01,12.80548553466797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,1,power_law_1.2,12.750214385986329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,1,power_law_1.2,12.795449829101562
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,16,balanced,2.47269868850708
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,16,balanced,2.4765920639038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,16,power_law_1.01,3.194207954406738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,16,power_law_1.01,3.365683364868164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,16,power_law_1.2,3.4315521240234377
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,16,power_law_1.2,3.614227294921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,2,balanced,7.504458745320638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,2,balanced,7.505840301513672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,2,power_law_1.01,7.6336509704589846
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,2,power_law_1.01,7.856006622314453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,2,power_law_1.2,8.13733139038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,2,power_law_1.2,8.40979232788086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,32,balanced,2.104309399922689
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,32,balanced,2.105583985646566
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,32,power_law_1.01,2.718227195739746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,32,power_law_1.01,2.7413759231567383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,32,power_law_1.2,3.0800384521484374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,32,power_law_1.2,3.2903553009033204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,4,balanced,4.413381258646647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,4,balanced,4.415247917175293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,4,power_law_1.01,5.146604919433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,4,power_law_1.01,5.226591873168945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,4,power_law_1.2,5.345171356201172
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,4,power_law_1.2,5.591519927978515
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,8,balanced,3.074687957763672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,8,balanced,3.0755093892415366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,8,power_law_1.01,3.6876094818115233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,8,power_law_1.01,4.069926452636719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,8,power_law_1.2,4.058208084106445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,1,8,power_law_1.2,4.307251358032227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,2,1,balanced,7.066277186075847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,2,1,balanced,7.06656010945638
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,2,1,power_law_1.01,6.878777313232422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,2,1,power_law_1.01,6.937177276611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,2,1,power_law_1.2,6.816294097900391
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,2,1,power_law_1.2,6.816844940185547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,4,1,balanced,3.9904425938924155
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,4,1,balanced,3.9905385971069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,4,1,power_law_1.01,3.8423038482666017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,4,1,power_law_1.01,3.8523006439208984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,4,1,power_law_1.2,3.840755081176758
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,6144,2560,8,160,4,1,power_law_1.2,3.851103973388672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,1,balanced,11.614021301269531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,1,balanced,11.62444814046224
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,1,power_law_1.01,12.88805694580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,1,power_law_1.01,12.938143920898437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,1,power_law_1.2,12.972953796386719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,1,power_law_1.2,13.002450561523437
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,128,balanced,1.8034186363220215
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,128,balanced,1.8072266578674316
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,128,power_law_1.01,2.1383808135986326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,128,power_law_1.01,2.168819236755371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,128,power_law_1.2,2.4129215240478517
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,128,power_law_1.2,2.4382656097412108
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,16,balanced,2.374879995981852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,16,balanced,2.375498612721761
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,16,power_law_1.01,3.0473087310791014
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,16,power_law_1.01,3.081772804260254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,16,power_law_1.2,3.1289087295532227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,16,power_law_1.2,3.3009281158447266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,2,balanced,6.8222401936848955
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,2,balanced,6.8323516845703125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,2,power_law_1.01,7.751929473876953
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,2,power_law_1.01,8.297087860107421
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,2,power_law_1.2,8.044921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,2,power_law_1.2,8.197798156738282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,256,balanced,1.7628906567891438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,256,balanced,1.7650346755981445
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,256,power_law_1.01,2.0619327545166017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,256,power_law_1.01,2.065702438354492
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,256,power_law_1.2,2.3854400634765627
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,256,power_law_1.2,2.3921728134155273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,32,balanced,2.0525867144266763
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,32,balanced,2.0527893702189126
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,32,power_law_1.01,2.4849664688110353
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,32,power_law_1.01,2.565452766418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,32,power_law_1.2,2.8811264038085938
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,32,power_law_1.2,2.9835391998291017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,4,balanced,4.288400014241536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,4,balanced,4.29425589243571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,4,power_law_1.01,5.13322868347168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,4,power_law_1.01,5.3299518585205075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,4,power_law_1.2,5.380243301391602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,4,power_law_1.2,5.47454719543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,64,balanced,1.8873012860616047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,64,balanced,1.8931573232014973
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,64,power_law_1.01,2.2985984802246096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,64,power_law_1.01,2.3756032943725587
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,64,power_law_1.2,2.618195152282715
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,64,power_law_1.2,2.7112960815429688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,8,balanced,2.910799980163574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,8,balanced,2.9163573582967124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,8,power_law_1.01,3.5314495086669924
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,8,power_law_1.01,3.5994625091552734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,8,power_law_1.2,3.839206314086914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,1,8,power_law_1.2,4.099468612670899
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,16,1,balanced,1.9593173662821453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,16,1,balanced,1.9595306714375813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,16,1,power_law_1.01,2.103206443786621
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,16,1,power_law_1.01,2.1130239486694338
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,16,1,power_law_1.2,2.1202816009521483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,16,1,power_law_1.2,2.124339294433594
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,2,1,balanced,6.43180783589681
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,2,1,balanced,6.441125233968099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,2,1,power_law_1.01,7.057017517089844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,2,1,power_law_1.01,7.065676879882813
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,2,1,power_law_1.2,7.066124725341797
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,2,1,power_law_1.2,7.070527648925781
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,4,1,balanced,3.707200050354004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,4,1,balanced,3.7089920043945312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,4,1,power_law_1.01,4.052377700805664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,4,1,power_law_1.01,4.063788986206054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,4,1,power_law_1.2,4.087801742553711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,4,1,power_law_1.2,4.097983932495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,8,1,balanced,5.108298619588216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,8,1,balanced,5.116122563680013
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,8,1,power_law_1.01,5.304735946655273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,8,1,power_law_1.01,5.308211135864258
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,8,1,power_law_1.2,5.3492286682128904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,256,8,1,power_law_1.2,5.399481582641601
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,1,balanced,13.110965728759766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,1,balanced,13.113717397054037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,1,power_law_1.01,13.90936279296875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,1,power_law_1.01,13.960159301757812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,1,power_law_1.2,14.172723388671875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,1,power_law_1.2,14.204179382324218
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,128,balanced,1.875322659810384
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,128,balanced,1.8776000340779622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,128,power_law_1.01,2.15677433013916
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,128,power_law_1.01,2.180723190307617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,128,power_law_1.2,2.3832767486572264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,128,power_law_1.2,2.5072959899902343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,16,balanced,2.513754685719808
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,16,balanced,2.516826629638672
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,16,power_law_1.01,2.975724792480469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,16,power_law_1.01,3.0342016220092773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,16,power_law_1.2,3.1435968399047853
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,16,power_law_1.2,3.268166351318359
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,2,balanced,7.590735753377278
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,2,balanced,7.594218571980794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,2,power_law_1.01,8.244735717773438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,2,power_law_1.01,8.488665771484374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,2,power_law_1.2,8.448172760009765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,2,power_law_1.2,8.645145416259766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,32,balanced,2.1530346870422363
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,32,balanced,2.1558292706807456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,32,power_law_1.01,2.5083711624145506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,32,power_law_1.01,2.701356887817383
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,32,power_law_1.2,2.7795263290405274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,32,power_law_1.2,2.8463680267333986
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,4,balanced,4.700031916300456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,4,balanced,4.708373387654622
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,4,power_law_1.01,5.374380874633789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,4,power_law_1.01,5.5118976593017575
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,4,power_law_1.2,5.403257751464844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,4,power_law_1.2,5.665817642211914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,64,balanced,1.9627359708150227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,64,balanced,1.96778138478597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,64,power_law_1.01,2.251961517333984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,64,power_law_1.01,2.3393791198730467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,64,power_law_1.2,2.5348928451538084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,64,power_law_1.2,2.5473344802856444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,8,balanced,3.2424694697062173
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,8,balanced,3.2459306716918945
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,8,power_law_1.01,3.8682689666748047
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,8,power_law_1.01,3.9143489837646483
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,8,power_law_1.2,3.909312057495117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,1,8,power_law_1.2,3.966342544555664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,16,1,balanced,2.524346669514974
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,16,1,balanced,2.5277387301127114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,16,1,power_law_1.01,2.496723175048828
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,16,1,power_law_1.01,2.4996992111206056
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,16,1,power_law_1.2,2.534764862060547
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,16,1,power_law_1.2,2.5368255615234374
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,2,1,balanced,7.210490544637044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,2,1,balanced,7.219157536824544
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,2,1,power_law_1.01,7.629510498046875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,2,1,power_law_1.01,7.631014251708985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,2,1,power_law_1.2,7.724467468261719
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,2,1,power_law_1.2,7.742195129394531
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,4,1,balanced,4.308149337768555
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,4,1,balanced,4.30836804707845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,4,1,power_law_1.01,4.493913650512695
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,4,1,power_law_1.01,4.499635314941406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,4,1,power_law_1.2,4.523904037475586
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,4,1,power_law_1.2,4.532070541381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,8,1,balanced,2.7922986348470054
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,8,1,balanced,2.7938667933146157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,8,1,power_law_1.01,2.926323127746582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,8,1,power_law_1.01,2.9311807632446287
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,8,1,power_law_1.2,2.9496128082275392
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,8192,7168,2048,8,384,8,1,power_law_1.2,2.9531839370727537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,1,balanced,0.14415466785430908
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,1,balanced,0.1442400018374125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,1,power_law_1.01,0.13676799535751344
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,1,power_law_1.01,0.1369279980659485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,1,power_law_1.2,0.14006400108337402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,1,power_law_1.2,0.14044159650802612
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,128,balanced,0.05128000179926554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,128,balanced,0.05197866757710775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,128,power_law_1.01,0.04954879879951477
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,128,power_law_1.01,0.04966399967670441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,128,power_law_1.2,0.05006719827651977
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,128,power_law_1.2,0.05085440278053284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,16,balanced,0.056261335810025535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,16,balanced,0.058058664202690125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,16,power_law_1.01,0.05542399883270264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,16,power_law_1.01,0.05583360195159912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,16,power_law_1.2,0.05551360249519348
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,16,power_law_1.2,0.05608320236206055
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,2,balanced,0.13780267039934793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,2,balanced,0.13933866222699484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,2,power_law_1.01,0.13468159437179567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,2,power_law_1.01,0.13507839441299438
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,2,power_law_1.2,0.13566720485687256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,2,power_law_1.2,0.1359935998916626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,32,balanced,0.05399466554323832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,32,balanced,0.05464000006516775
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,32,power_law_1.01,0.05351679921150208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,32,power_law_1.01,0.05364480018615723
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,32,power_law_1.2,0.052716797590255736
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,32,power_law_1.2,0.0536575973033905
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,4,balanced,0.09969066580136617
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,4,balanced,0.101200004418691
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,4,power_law_1.01,0.09579520225524903
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,4,power_law_1.01,0.09705600142478943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,4,power_law_1.2,0.09486079812049866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,4,power_law_1.2,0.096806401014328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,64,balanced,0.05263466636339823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,64,balanced,0.05266133447488149
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,64,power_law_1.01,0.05053439736366272
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,64,power_law_1.01,0.05244160294532776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,64,power_law_1.2,0.050911998748779295
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,64,power_law_1.2,0.05189759731292724
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,8,balanced,0.06629866858323415
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,8,balanced,0.06809066732724507
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,8,power_law_1.01,0.06506879925727845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,8,power_law_1.01,0.066348797082901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,8,power_law_1.2,0.06396160125732422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,1,8,power_law_1.2,0.06504319906234741
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,2,1,balanced,0.10106666882832845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,2,1,balanced,0.10123200217882793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,2,1,power_law_1.01,0.09589120149612426
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,2,1,power_law_1.01,0.09624959826469422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,2,1,power_law_1.2,0.09664639830589294
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,2048,768,8,128,2,1,power_law_1.2,0.09749119877815246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,1,balanced,1.022447983423869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,1,balanced,1.0228959719340007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,1,power_law_1.01,0.8471424102783203
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,1,power_law_1.01,0.8504256248474121
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,1,power_law_1.2,0.8216704368591309
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,1,power_law_1.2,0.8241215705871582
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,128,balanced,0.09686932961146037
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,128,balanced,0.09724799791971843
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,128,power_law_1.01,0.09528319835662842
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,128,power_law_1.01,0.0953984022140503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,128,power_law_1.2,0.09512320160865784
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,128,power_law_1.2,0.09528959989547729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,16,balanced,0.1534346640110016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,16,balanced,0.1541813313961029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,16,power_law_1.01,0.14361599683761597
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,16,power_law_1.01,0.14499200582504274
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,16,power_law_1.2,0.14613120555877684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,16,power_law_1.2,0.1462656021118164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,2,balanced,0.5600053469340006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,2,balanced,0.5626879930496216
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,2,power_law_1.01,0.48216958045959474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,2,power_law_1.01,0.49704318046569823
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,2,power_law_1.2,0.4820543766021729
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,2,power_law_1.2,0.48302721977233887
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,256,balanced,0.09512533744176228
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,256,balanced,0.09587732950846355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,256,power_law_1.01,0.0930239975452423
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,256,power_law_1.01,0.09308800101280212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,256,power_law_1.2,0.0934656023979187
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,256,power_law_1.2,0.09359999895095825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,32,balanced,0.12158399820327759
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,32,balanced,0.12319999933242798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,32,power_law_1.01,0.11504000425338745
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,32,power_law_1.01,0.11900160312652588
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,32,power_law_1.2,0.1185215950012207
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,32,power_law_1.2,0.12076159715652465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,4,balanced,0.3320213357607524
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,4,balanced,0.3320639928181966
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,4,power_law_1.01,0.28248960971832277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,4,power_law_1.01,0.29788799285888673
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,4,power_law_1.2,0.28833279609680174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,4,power_law_1.2,0.2891135931015015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,64,balanced,0.10301867127418518
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,64,balanced,0.10316800077756245
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,64,power_law_1.01,0.10065280199050904
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,64,power_law_1.01,0.10115200281143188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,64,power_law_1.2,0.09995520114898682
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,64,power_law_1.2,0.1009984016418457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,8,balanced,0.21371734142303467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,8,balanced,0.21410665909449259
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,8,power_law_1.01,0.18752000331878663
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,8,power_law_1.01,0.1947711944580078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,8,power_law_1.2,0.18969600200653075
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,1,8,power_law_1.2,0.20096640586853026
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,2,1,balanced,0.5720533529917399
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,2,1,balanced,0.5721120039621989
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,2,1,power_law_1.01,0.45972480773925783
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,2,1,power_law_1.01,0.4767104148864746
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,2,1,power_law_1.2,0.4684800148010254
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,2,1,power_law_1.2,0.46927361488342284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,4,1,balanced,0.34679468472798664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,4,1,balanced,0.34851733843485516
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,4,1,power_law_1.01,0.2857919931411743
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,4,1,power_law_1.01,0.28833279609680174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,4,1,power_law_1.2,0.289190411567688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,3072,1536,8,256,4,1,power_law_1.2,0.292902398109436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,1,balanced,0.45154666900634766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,1,balanced,0.45369601249694824
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,1,power_law_1.01,0.45288958549499514
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,1,power_law_1.01,0.48033919334411623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,1,power_law_1.2,0.4551936149597168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,1,power_law_1.2,0.48239998817443847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,2,balanced,0.32499200105667114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,2,balanced,0.32653866211573285
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,2,power_law_1.01,0.3288703918457031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,2,power_law_1.01,0.33692159652709963
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,2,power_law_1.2,0.3314111948013306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,2,power_law_1.2,0.33790719509124756
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,4,balanced,0.25190399090449017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,4,balanced,0.25201600790023804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,4,power_law_1.01,0.26528000831604004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,4,power_law_1.01,0.26995201110839845
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,4,power_law_1.2,0.271616005897522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,4,power_law_1.2,0.2764352083206177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,8,balanced,0.22100265820821127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,8,balanced,0.22124266624450684
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,8,power_law_1.01,0.23328640460968017
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,8,power_law_1.01,0.24372479915618897
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,8,power_law_1.2,0.2283519983291626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,1,8,power_law_1.2,0.23381121158599855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,16,1,balanced,0.07259733478228252
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,16,1,balanced,0.07292800148328145
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,16,1,power_law_1.01,0.06876159906387329
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,16,1,power_law_1.01,0.07215999960899352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,16,1,power_law_1.2,0.07180160284042358
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,16,1,power_law_1.2,0.07455360293388366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,2,1,balanced,0.25781333446502686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,2,1,balanced,0.2579946716626485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,2,1,power_law_1.01,0.25556480884552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,2,1,power_law_1.01,0.25596160888671876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,2,1,power_law_1.2,0.25680639743804934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,2,1,power_law_1.2,0.26684160232543946
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,4,1,balanced,0.1462453305721283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,4,1,balanced,0.14666133125623068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,4,1,power_law_1.01,0.1442304015159607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,4,1,power_law_1.01,0.14481279850006104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,4,1,power_law_1.2,0.14496639966964722
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,4,1,power_law_1.2,0.15073920488357545
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,8,1,balanced,0.0886240005493164
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,8,1,balanced,0.08954667051633199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,8,1,power_law_1.01,0.08824319839477539
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,8,1,power_law_1.01,0.08844159841537476
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,8,1,power_law_1.2,0.08804479837417603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,14336,2,8,8,1,power_law_1.2,0.08880640268325805
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,1,balanced,0.700645367304484
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,1,balanced,0.7033013502756754
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,1,power_law_1.01,0.6489344120025635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,1,power_law_1.01,0.6526144027709961
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,1,power_law_1.2,0.6605504035949707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,1,power_law_1.2,0.6625792026519776
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,128,balanced,0.07526400188604991
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,128,balanced,0.07659199833869934
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,128,power_law_1.01,0.07626879811286927
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,128,power_law_1.01,0.07807360291481018
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,128,power_law_1.2,0.07596799731254578
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,128,power_law_1.2,0.07736960053443909
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,16,balanced,0.11276266972223918
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,16,balanced,0.11386133233706157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,16,power_law_1.01,0.10931839942932128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,16,power_law_1.01,0.11060479879379273
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,16,power_law_1.2,0.10957440137863159
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,16,power_law_1.2,0.11009279489517212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,2,balanced,0.398965318997701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,2,balanced,0.4007519880930583
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,2,power_law_1.01,0.35786240100860595
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,2,power_law_1.01,0.3712127923965454
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,2,power_law_1.2,0.38112640380859375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,2,power_law_1.2,0.3874111890792847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,32,balanced,0.09803199768066406
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,32,balanced,0.09914666414260864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,32,power_law_1.01,0.09583359956741333
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,32,power_law_1.01,0.09722239971160888
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,32,power_law_1.2,0.09697920083999634
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,32,power_law_1.2,0.09728639721870422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,4,balanced,0.2305226723353068
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,4,balanced,0.231605331103007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,4,power_law_1.01,0.21674880981445313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,4,power_law_1.01,0.22660479545593262
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,4,power_law_1.2,0.2246272087097168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,4,power_law_1.2,0.22652161121368408
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,64,balanced,0.08380267024040222
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,64,balanced,0.08515733480453491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,64,power_law_1.01,0.08240000009536744
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,64,power_law_1.01,0.08689919710159302
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,64,power_law_1.2,0.08273280262947083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,64,power_law_1.2,0.08487039804458618
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,8,balanced,0.16078933080037436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,8,balanced,0.16180800398190817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,8,power_law_1.01,0.15815039873123168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,8,power_law_1.01,0.15884159803390502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,8,power_law_1.2,0.1589184045791626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,1,8,power_law_1.2,0.1599552035331726
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,2,1,balanced,0.24034132560094199
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,2,1,balanced,0.2416693369547526
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,2,1,power_law_1.01,0.22870399951934814
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,2,1,power_law_1.01,0.23057920932769777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,2,1,power_law_1.2,0.23677439689636232
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,2,1,power_law_1.2,0.23792641162872313
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,4,1,balanced,0.1606666644414266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,4,1,balanced,0.16280532876650491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,4,1,power_law_1.01,0.15508480072021485
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,4,1,power_law_1.01,0.15522559881210327
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,4,1,power_law_1.2,0.15884159803390502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,1536,8,128,4,1,power_law_1.2,0.15989760160446168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,1,balanced,4.418464024861653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,1,balanced,4.420549392700195
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,1,power_law_1.01,3.797420883178711
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,1,power_law_1.01,3.8093055725097655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,1,power_law_1.2,3.780070495605469
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,1,power_law_1.2,3.8125247955322266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,128,balanced,0.2853920062383016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,128,balanced,0.2871146599451701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,128,power_law_1.01,0.2840127944946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,128,power_law_1.01,0.28412799835205077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,128,power_law_1.2,0.28257920742034914
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,128,power_law_1.2,0.28488318920135497
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,16,balanced,0.5232586860656738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,16,balanced,0.5242346525192261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,16,power_law_1.01,0.4983039855957031
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,16,power_law_1.01,0.5022272109985352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,16,power_law_1.2,0.5028927803039551
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,16,power_law_1.2,0.5154816150665283
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,2,balanced,2.343045393625895
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,2,balanced,2.3446079889933267
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,2,power_law_1.01,2.0595071792602537
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,2,power_law_1.01,2.0605184555053713
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,2,power_law_1.2,1.9977344512939452
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,2,power_law_1.2,2.074611282348633
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,256,balanced,0.2688000003496806
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,256,balanced,0.2691146731376648
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,256,power_law_1.01,0.2669248104095459
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,256,power_law_1.01,0.2680704116821289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,256,power_law_1.2,0.2687040090560913
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,256,power_law_1.2,0.2688256025314331
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,32,balanced,0.3914080063501994
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,32,balanced,0.391429344813029
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,32,power_law_1.01,0.3801471948623657
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,32,power_law_1.01,0.38553600311279296
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,32,power_law_1.2,0.3754879951477051
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,32,power_law_1.2,0.3777343988418579
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,4,balanced,1.3091253439585369
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,4,balanced,1.3106186389923096
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,4,power_law_1.01,1.1724543571472168
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,4,power_law_1.01,1.225267219543457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,4,power_law_1.2,1.1666175842285156
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,4,power_law_1.2,1.1836352348327637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,64,balanced,0.32423466444015503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,64,balanced,0.32611199220021564
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,64,power_law_1.01,0.31831040382385256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,64,power_law_1.01,0.3212032079696655
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,64,power_law_1.2,0.3185728073120117
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,64,power_law_1.2,0.3196160078048706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,8,balanced,0.7898080348968506
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,8,balanced,0.7931359608968099
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,8,power_law_1.01,0.6962175846099854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,8,power_law_1.01,0.7059519767761231
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,8,power_law_1.2,0.7334527969360352
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,4096,2688,22,512,1,8,power_law_1.2,0.7432127952575683
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,1,balanced,0.7636000315348307
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,1,balanced,0.7655946413675944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,1,power_law_1.01,0.7803840160369873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,1,power_law_1.01,0.785964822769165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,1,power_law_1.2,0.7757376194000244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,1,power_law_1.2,0.7985663890838623
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,2,balanced,0.4413333336512248
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,2,balanced,0.44223467508951825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,2,power_law_1.01,0.4745920181274414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,2,power_law_1.01,0.4824831962585449
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,2,power_law_1.2,0.4550144195556641
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,2,power_law_1.2,0.48168320655822755
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,4,balanced,0.3213760058085124
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,4,balanced,0.3250346581141154
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,4,power_law_1.01,0.3487103939056396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,4,power_law_1.01,0.36521599292755125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,4,power_law_1.2,0.349017596244812
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,4,power_law_1.2,0.3593663930892944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,8,balanced,0.271232008934021
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,8,balanced,0.2714560031890869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,8,power_law_1.01,0.28318080902099607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,8,power_law_1.01,0.2986176013946533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,8,power_law_1.2,0.29932799339294436
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,1,8,power_law_1.2,0.30001280307769773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,16,1,balanced,0.10897599657376607
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,16,1,balanced,0.11012799541155498
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,16,1,power_law_1.01,0.10709120035171509
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,16,1,power_law_1.01,0.10758399963378906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,16,1,power_law_1.2,0.10722559690475464
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,16,1,power_law_1.2,0.10750080347061157
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,2,1,balanced,0.4216906627019246
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,2,1,balanced,0.4220586617787679
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,2,1,power_law_1.01,0.4272895812988281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,2,1,power_law_1.01,0.42821760177612306
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,2,1,power_law_1.2,0.41899518966674804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,2,1,power_law_1.2,0.4202303886413574
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,32,1,balanced,0.09054932991663615
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,32,1,balanced,0.09090133508046468
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,32,1,power_law_1.01,0.08937600255012512
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,32,1,power_law_1.01,0.09004799723625183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,32,1,power_law_1.2,0.08901119828224183
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,32,1,power_law_1.2,0.08934400081634522
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,4,1,balanced,0.22924266258875528
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,4,1,balanced,0.254533330599467
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,4,1,power_law_1.01,0.22700159549713134
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,4,1,power_law_1.01,0.22764160633087158
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,4,1,power_law_1.2,0.22607998847961425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,4,1,power_law_1.2,0.22729599475860596
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,8,1,balanced,0.13321066896120706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,8,1,balanced,0.13380266229311624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,8,1,power_law_1.01,0.13131519556045532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,8,1,power_law_1.01,0.13218560218811035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,8,1,power_law_1.2,0.1304255962371826
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,16384,2,8,8,1,power_law_1.2,0.13048319816589354
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,1,balanced,2.5336106618245444
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,1,balanced,2.5350186030069985
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,1,power_law_1.01,2.0327423095703123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,1,power_law_1.01,2.0625984191894533
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,1,power_law_1.2,2.0230016708374023
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,1,power_law_1.2,2.0946176528930662
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,128,balanced,0.16080000003178915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,128,balanced,0.16124266386032104
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,128,power_law_1.01,0.1587839961051941
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,128,power_law_1.01,0.15916800498962402
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,128,power_law_1.2,0.15849599838256836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,128,power_law_1.2,0.15970560312271118
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,16,balanced,0.28864532709121704
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,16,balanced,0.2895359992980957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,16,power_law_1.01,0.26389760971069337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,16,power_law_1.01,0.27023360729217527
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,16,power_law_1.2,0.25483520030975343
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,16,power_law_1.2,0.2703423976898193
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,2,balanced,1.3302666346232097
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,2,balanced,1.330954631169637
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,2,power_law_1.01,1.107801628112793
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,2,power_law_1.01,1.1110591888427734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,2,power_law_1.2,1.0738944053649901
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,2,power_law_1.2,1.1272064208984376
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,256,balanced,0.14472533265749613
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,256,balanced,0.1477013329664866
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,256,power_law_1.01,0.14662400484085084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,256,power_law_1.01,0.15204479694366455
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,256,power_law_1.2,0.14404480457305907
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,256,power_law_1.2,0.14916479587554932
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,32,balanced,0.21421867609024048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,32,balanced,0.2151413361231486
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,32,power_law_1.01,0.20446081161499025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,32,power_law_1.01,0.20891520977020264
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,32,power_law_1.2,0.20480639934539796
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,32,power_law_1.2,0.20730879306793212
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,4,balanced,0.7403733730316162
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,4,balanced,0.7433546384175619
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,4,power_law_1.01,0.6340799808502198
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,4,power_law_1.01,0.6742911815643311
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,4,power_law_1.2,0.633843183517456
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,4,power_law_1.2,0.6641471862792969
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,64,balanced,0.17468265692392984
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,64,balanced,0.17537067333857217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,64,power_law_1.01,0.171942400932312
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,64,power_law_1.01,0.17330559492111205
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,64,power_law_1.2,0.17164160013198854
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,64,power_law_1.2,0.17365119457244874
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,8,balanced,0.4344853162765503
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,8,balanced,0.43484266599019367
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,8,power_law_1.01,0.3879040002822876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,8,power_law_1.01,0.40361599922180175
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,8,power_law_1.2,0.3825792074203491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,1,8,power_law_1.2,0.38821120262145997
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,16,1,balanced,0.3395040035247803
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,16,1,balanced,0.3398666779200236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,16,1,power_law_1.01,0.3086143970489502
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,16,1,power_law_1.01,0.31088640689849856
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,16,1,power_law_1.2,0.305132794380188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,16,1,power_law_1.2,0.30589439868927004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,2,1,balanced,1.3472426732381184
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,2,1,balanced,1.3477813402811687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,2,1,power_law_1.01,1.1040896415710448
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,2,1,power_law_1.01,1.1083200454711915
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,2,1,power_law_1.2,1.095622444152832
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,2,1,power_law_1.2,1.1189248085021972
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,4,1,balanced,0.45631468296051025
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,4,1,balanced,0.45708266894022626
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,4,1,power_law_1.01,0.36418559551239016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,4,1,power_law_1.01,0.3724479913711548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,4,1,power_law_1.2,0.3709503889083862
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,4,1,power_law_1.2,0.3767103910446167
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,8,1,balanced,0.28430400292078656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,8,1,balanced,0.2848479946454366
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,8,1,power_law_1.01,0.2443392038345337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,8,1,power_law_1.01,0.24603519439697266
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,8,1,power_law_1.2,0.24254720211029052
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2048,8,256,8,1,power_law_1.2,0.2451456069946289
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,1,balanced,2.000373363494873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,1,balanced,2.000922679901123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,1,power_law_1.01,1.7917247772216798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,1,power_law_1.01,1.822969627380371
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,1,power_law_1.2,1.8142656326293944
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,1,power_law_1.2,1.831545639038086
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,16,balanced,0.23861332734425864
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,16,balanced,0.2386666735013326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,16,power_law_1.01,0.23289599418640136
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,16,power_law_1.01,0.23313279151916505
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,16,power_law_1.2,0.23249919414520265
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,16,power_law_1.2,0.2347264051437378
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,2,balanced,1.0499733289082844
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,2,balanced,1.051103989283244
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,2,power_law_1.01,0.9231936454772949
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,2,power_law_1.01,0.9398079872131347
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,2,power_law_1.2,0.9537343978881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,2,power_law_1.2,0.9814399719238281
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,32,balanced,0.16757865746816
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,32,balanced,0.1676959991455078
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,32,power_law_1.01,0.16487040519714355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,32,power_law_1.01,0.1651520013809204
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,32,power_law_1.2,0.1669376015663147
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,32,power_law_1.2,0.1674623966217041
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,4,balanced,0.41859734058380127
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,4,balanced,0.4195626576741536
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,4,power_law_1.01,0.3846400022506714
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,4,power_law_1.01,0.393503999710083
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,4,power_law_1.2,0.3847552061080933
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,4,power_law_1.2,0.40152320861816404
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,8,balanced,0.34694401423136395
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,8,balanced,0.3479893207550049
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,8,power_law_1.01,0.32880001068115233
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,8,power_law_1.01,0.3362943887710571
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,8,power_law_1.2,0.32986879348754883
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,1,8,power_law_1.2,0.3346368074417114
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,2,1,balanced,1.0596319834391277
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,2,1,balanced,1.0596746603647869
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,2,1,power_law_1.01,0.9612095832824707
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,2,1,power_law_1.01,0.961734390258789
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,2,1,power_law_1.2,0.9671551704406738
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,2,1,power_law_1.2,0.9790399551391602
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,4,1,balanced,0.3597866694132487
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,4,1,balanced,0.35990933577219647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,4,1,power_law_1.01,0.3319040060043335
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,4,1,power_law_1.01,0.33537280559539795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,4,1,power_law_1.2,0.33924479484558107
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,6144,2560,8,160,4,1,power_law_1.2,0.34004480838775636
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,1,balanced,2.9530665079752603
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,1,balanced,2.955685297648112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,1,power_law_1.01,2.3644927978515624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,1,power_law_1.01,2.381171226501465
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,1,power_law_1.2,2.3833663940429686
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,1,power_law_1.2,2.3976831436157227
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,128,balanced,0.1853333314259847
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,128,balanced,0.18542933464050293
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,128,power_law_1.01,0.18336639404296876
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,128,power_law_1.01,0.18368639945983886
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,128,power_law_1.2,0.18401919603347777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,128,power_law_1.2,0.18408960103988647
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,16,balanced,0.32630399862925213
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,16,balanced,0.32807467381159466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,16,power_law_1.01,0.2996864080429077
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,16,power_law_1.01,0.307206392288208
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,16,power_law_1.2,0.30586240291595457
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,16,power_law_1.2,0.3068671941757202
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,2,balanced,1.5463253657023113
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,2,balanced,1.547375996907552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,2,power_law_1.01,1.2359552383422852
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,2,power_law_1.01,1.2797823905944825
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,2,power_law_1.2,1.3046719551086425
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,2,power_law_1.2,1.3101119995117188
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,256,balanced,0.17091200749079385
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,256,balanced,0.17488000790278116
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,256,power_law_1.01,0.1680896043777466
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,256,power_law_1.01,0.17479679584503174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,256,power_law_1.2,0.1689087986946106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,256,power_law_1.2,0.17149440050125123
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,32,balanced,0.23850133021672568
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,32,balanced,0.23976532618204752
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,32,power_law_1.01,0.22395520210266112
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,32,power_law_1.01,0.2355583906173706
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,32,power_law_1.2,0.22866559028625488
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,32,power_law_1.2,0.23606400489807128
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,4,balanced,0.8553173542022705
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,4,balanced,0.8560799757639567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,4,power_law_1.01,0.7408768177032471
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,4,power_law_1.01,0.7647359848022461
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,4,power_law_1.2,0.7244416236877441
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,4,power_law_1.2,0.7725056171417236
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,64,balanced,0.1973653237024943
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,64,balanced,0.19788267215092978
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,64,power_law_1.01,0.19449599981307983
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,64,power_law_1.01,0.19653120040893554
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,64,power_law_1.2,0.19411840438842773
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,64,power_law_1.2,0.19505280256271362
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,8,balanced,0.5029226541519165
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,8,balanced,0.5031520128250122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,8,power_law_1.01,0.45949440002441405
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,8,power_law_1.01,0.4615231990814209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,8,power_law_1.2,0.44774398803710935
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,1,8,power_law_1.2,0.4526080131530762
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,16,1,balanced,0.39100801944732666
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,16,1,balanced,0.39180266857147217
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,16,1,power_law_1.01,0.35459198951721194
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,16,1,power_law_1.01,0.35704960823059084
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,16,1,power_law_1.2,0.35250558853149416
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,16,1,power_law_1.2,0.3546367883682251
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,2,1,balanced,1.5706240336100261
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,2,1,balanced,1.5713653564453125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,2,1,power_law_1.01,1.2981120109558106
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,2,1,power_law_1.01,1.3010623931884766
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,2,1,power_law_1.2,1.2363712310791015
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,2,1,power_law_1.2,1.2581695556640624
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,4,1,balanced,0.533242662747701
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,4,1,balanced,0.5368426640828451
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,4,1,power_law_1.01,0.43357439041137696
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,4,1,power_law_1.01,0.4422976016998291
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,4,1,power_law_1.2,0.43566079139709474
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,4,1,power_law_1.2,0.4396671772003174
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,8,1,balanced,0.33177600304285687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,8,1,balanced,0.3326293428738912
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,8,1,power_law_1.01,0.2776959896087646
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,8,1,power_law_1.01,0.28035199642181396
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,8,1,power_law_1.2,0.2687936067581177
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,256,8,1,power_law_1.2,0.28010239601135256
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,1,balanced,4.37992000579834
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,1,balanced,4.380031903584798
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,1,power_law_1.01,3.126515197753906
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,1,power_law_1.01,3.2126720428466795
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,1,power_law_1.2,3.0944576263427734
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,1,power_law_1.2,3.155583953857422
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,128,balanced,0.23707199096679688
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,128,balanced,0.23741867144902548
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,128,power_law_1.01,0.23589119911193848
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,128,power_law_1.01,0.23600640296936035
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,128,power_law_1.2,0.23471360206604003
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,128,power_law_1.2,0.23632640838623048
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,16,balanced,0.46902934710184735
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,16,balanced,0.4699999888737996
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,16,power_law_1.01,0.410975980758667
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,16,power_law_1.01,0.425164794921875
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,16,power_law_1.2,0.43659520149230957
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,16,power_law_1.2,0.443071985244751
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,2,balanced,2.2843039830525718
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,2,balanced,2.2925599416097007
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,2,power_law_1.01,1.7111103057861328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,2,power_law_1.01,1.7255168914794923
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,2,power_law_1.2,1.7237567901611328
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,2,power_law_1.2,1.8147647857666016
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,32,balanced,0.33949867884318036
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,32,balanced,0.34095998605092365
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,32,power_law_1.01,0.3162175893783569
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,32,power_law_1.01,0.33253118991851804
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,32,power_law_1.2,0.3059776067733765
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,32,power_law_1.2,0.3255552053451538
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,4,balanced,1.250442663828532
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,4,balanced,1.2532479763031006
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,4,power_law_1.01,1.0027520179748535
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,4,power_law_1.01,1.0453503608703614
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,4,power_law_1.2,0.9127743721008301
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,4,power_law_1.2,1.022003173828125
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,64,balanced,0.26890132824579877
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,64,balanced,0.2720959981282552
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,64,power_law_1.01,0.2612799882888794
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,64,power_law_1.01,0.26403839588165284
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,64,power_law_1.2,0.2572736024856567
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,64,power_law_1.2,0.26577279567718504
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,8,balanced,0.7331519921620687
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,8,balanced,0.7340319951375326
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,8,power_law_1.01,0.6651008129119873
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,8,power_law_1.01,0.6843008041381836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,8,power_law_1.2,0.6203775882720948
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,1,8,power_law_1.2,0.7008384227752685
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,16,1,balanced,0.3204853336016337
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,16,1,balanced,0.3215893308321635
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,16,1,power_law_1.01,0.230515193939209
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,16,1,power_law_1.01,0.23285119533538817
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,16,1,power_law_1.2,0.22840960025787355
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,16,1,power_law_1.2,0.22842879295349122
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,2,1,balanced,2.3274827003479004
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,2,1,balanced,2.346346696217855
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,2,1,power_law_1.01,1.7037055969238282
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,2,1,power_law_1.01,1.715078353881836
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,2,1,power_law_1.2,1.6700223922729491
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,2,1,power_law_1.2,1.6774208068847656
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,4,1,balanced,1.3141120274861653
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,4,1,balanced,1.3147573471069336
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,4,1,power_law_1.01,0.9819711685180664
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,4,1,power_law_1.01,0.9835519790649414
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,4,1,power_law_1.2,0.9622464179992676
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,4,1,power_law_1.2,0.9660544395446777
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,8,1,balanced,0.45394134521484375
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,8,1,balanced,0.4557386636734009
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,8,1,power_law_1.01,0.3361151933670044
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,8,1,power_law_1.01,0.3379199981689453
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,8,1,power_law_1.2,0.32680959701538087
VLLM,0.19.0,NVIDIA B200,moe,vllm_fused_moe,fp8_block,96,7168,2048,8,384,8,1,power_law_1.2,0.33210880756378175
